diff --git "a/perplexity50/3491169.out" "b/perplexity50/3491169.out" new file mode 100644--- /dev/null +++ "b/perplexity50/3491169.out" @@ -0,0 +1,40497 @@ +Model parameters: d_model 2560 ffw_size 10240 kv_size 128 n_heads 20 n_layers 34 +Megatron-DeepSpeed/pretrain_gpt.py --tensor-model-parallel-size 2 --pipeline-model-parallel-size 1 --num-layers 34 --hidden-size 2560 --num-attention-heads 20 --kv-channels 128 --ffn-hidden-size 10240 --seq-length 2048 --max-position-embeddings 2048 --micro-batch-size 2 --global-batch-size 1024 --train-samples 1 --vocab-file gpt2/vocab.json --merge-file gpt2/merges.txt --clip-grad 1.0 --kill-switch-path kill-switch-4b284b84bperplexity50val --bf16 --optimizer adam --adam-beta1 0.9 --adam-beta2 0.999 --adam-eps 1e-8 --lr 2e-4 --min-lr 2e-5 --lr-decay-style cosine --lr-decay-samples 1 --lr-warmup-samples 0 --clip-grad 1.0 --weight-decay 1e-1 --override-lr-scheduler --reset-progress --no-load-optim --log-interval 10 --save-interval 1000 --eval-interval 1 --eval-iters 100 --eval-only true --tensorboard-dir tensorboard_4b284b84bperplexity50val --tensorboard-queue-size 5 --log-timers-to-tensorboard --log-batch-size-to-tensorboard --log-validation-ppl-to-tensorboard --save lm1-4b2-84b-c4-perplexity/perplexity50 --load lm1-4b2-84b-c4-perplexity/perplexity50 --train-weighted-split-paths-path train1b5.txt --valid-weighted-split-paths-path val.txt --data-impl mmap --deepspeed --deepspeed_config ds_configs/3491169.json --zero-stage 0 +START 3491169: Wed 10 May 2023 12:51:16 PM EEST + 0: + 0: + 0: ======================= ROCm System Management Interface ======================= + 0: ================================= Concise Info ================================= + 0: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 0: 0 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 2 43.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 3 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 4 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 6 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: ================================================================================ + 0: ============================= End of ROCm SMI Log ============================== +12: +12: +12: ======================= ROCm System Management Interface ======================= +12: ================================= Concise Info ================================= +12: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +12: 0 46.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 2 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 4 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 6 49.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: ================================================================================ +12: ============================= End of ROCm SMI Log ============================== +14: +14: +14: ======================= ROCm System Management Interface ======================= +14: ================================= Concise Info ================================= +14: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +14: 0 47.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 2 38.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 4 45.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 6 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: ================================================================================ +14: ============================= End of ROCm SMI Log ============================== + 5: + 5: + 5: ======================= ROCm System Management Interface ======================= + 5: ================================= Concise Info ================================= + 5: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 5: 0 46.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 2 38.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 4 47.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 6 36.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: ================================================================================ + 5: ============================= End of ROCm SMI Log ============================== +20: +20: +20: ======================= ROCm System Management Interface ======================= +20: ================================= Concise Info ================================= +20: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +20: 0 47.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 1 54.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 2 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 4 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 6 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: ================================================================================ +20: ============================= End of ROCm SMI Log ============================== +17: +17: +17: ======================= ROCm System Management Interface ======================= +17: ================================= Concise Info ================================= +17: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +17: 0 47.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 2 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 4 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 6 36.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: ================================================================================ +17: ============================= End of ROCm SMI Log ============================== +30: +30: +30: ======================= ROCm System Management Interface ======================= +30: ================================= Concise Info ================================= +30: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +30: 0 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 2 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 4 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 6 47.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: ================================================================================ +30: ============================= End of ROCm SMI Log ============================== +22: +22: +22: ======================= ROCm System Management Interface ======================= +22: ================================= Concise Info ================================= +22: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +22: 0 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 2 40.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 4 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 6 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: ================================================================================ +22: ============================= End of ROCm SMI Log ============================== +25: +25: +25: ======================= ROCm System Management Interface ======================= +25: ================================= Concise Info ================================= +25: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +25: 0 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 2 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 4 42.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 6 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: ================================================================================ +25: ============================= End of ROCm SMI Log ============================== +28: +28: +28: ======================= ROCm System Management Interface ======================= +28: ================================= Concise Info ================================= +28: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +28: 0 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 2 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 4 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 6 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: ================================================================================ +28: ============================= End of ROCm SMI Log ============================== +31: +31: +31: ======================= ROCm System Management Interface ======================= +31: ================================= Concise Info ================================= +31: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +31: 0 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 2 39.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 4 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 6 39.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: ================================================================================ +31: ============================= End of ROCm SMI Log ============================== +18: +18: +18: ======================= ROCm System Management Interface ======================= +18: ================================= Concise Info ================================= +18: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +18: 0 46.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 2 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 4 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 6 47.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: ================================================================================ +18: ============================= End of ROCm SMI Log ============================== + 6: + 6: + 6: ======================= ROCm System Management Interface ======================= + 6: ================================= Concise Info ================================= + 6: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 6: 0 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 2 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 4 38.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 6 36.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: ================================================================================ + 6: ============================= End of ROCm SMI Log ============================== +23: +23: +23: ======================= ROCm System Management Interface ======================= +23: ================================= Concise Info ================================= +23: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +23: 0 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 2 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 4 40.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 6 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: ================================================================================ +23: ============================= End of ROCm SMI Log ============================== +26: +26: +26: ======================= ROCm System Management Interface ======================= +26: ================================= Concise Info ================================= +26: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +26: 0 45.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 2 43.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 4 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 6 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: ================================================================================ +26: ============================= End of ROCm SMI Log ============================== +13: +13: +13: ======================= ROCm System Management Interface ======================= +13: ================================= Concise Info ================================= +13: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +13: 0 51.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 3 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 4 42.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 6 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: ================================================================================ +13: ============================= End of ROCm SMI Log ============================== +27: +27: +27: ======================= ROCm System Management Interface ======================= +27: ================================= Concise Info ================================= +27: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +27: 0 52.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 2 42.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 4 44.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 6 37.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: ================================================================================ +27: ============================= End of ROCm SMI Log ============================== + 8: + 8: + 8: ======================= ROCm System Management Interface ======================= + 8: ================================= Concise Info ================================= + 8: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 8: 0 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 2 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 4 46.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 6 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 7 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: ================================================================================ + 8: ============================= End of ROCm SMI Log ============================== + 7: + 7: + 7: ======================= ROCm System Management Interface ======================= + 7: ================================= Concise Info ================================= + 7: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 7: 0 50.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 2 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 4 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: ================================================================================ + 7: ============================= End of ROCm SMI Log ============================== + 1: + 1: + 1: ======================= ROCm System Management Interface ======================= + 1: ================================= Concise Info ================================= + 1: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 1: 0 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 4 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 6 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: ================================================================================ + 1: ============================= End of ROCm SMI Log ============================== + 9: + 9: + 9: ======================= ROCm System Management Interface ======================= + 9: ================================= Concise Info ================================= + 9: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 9: 0 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 2 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 4 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 6 40.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: ================================================================================ + 9: ============================= End of ROCm SMI Log ============================== +24: +24: +24: ======================= ROCm System Management Interface ======================= +24: ================================= Concise Info ================================= +24: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +24: 0 49.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 2 38.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 4 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 6 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: ================================================================================ +24: ============================= End of ROCm SMI Log ============================== + 2: + 2: + 2: ======================= ROCm System Management Interface ======================= + 2: ================================= Concise Info ================================= + 2: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 2: 0 46.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 2 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 4 37.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 6 42.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: ================================================================================ + 2: ============================= End of ROCm SMI Log ============================== + 3: + 3: + 3: ======================= ROCm System Management Interface ======================= + 3: ================================= Concise Info ================================= + 3: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 3: 0 45.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 2 41.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 4 42.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 6 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 7 38.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: ================================================================================ + 3: ============================= End of ROCm SMI Log ============================== + 4: + 4: + 4: ======================= ROCm System Management Interface ======================= + 4: ================================= Concise Info ================================= + 4: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 4: 0 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 2 47.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 4 42.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 6 46.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: ================================================================================ + 4: ============================= End of ROCm SMI Log ============================== +15: +15: +15: ======================= ROCm System Management Interface ======================= +15: ================================= Concise Info ================================= +15: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +15: 0 46.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 4 48.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 6 41.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: ================================================================================ +15: ============================= End of ROCm SMI Log ============================== +10: +10: +10: ======================= ROCm System Management Interface ======================= +10: ================================= Concise Info ================================= +10: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +10: 0 47.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 2 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 3 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 4 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 6 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: ================================================================================ +10: ============================= End of ROCm SMI Log ============================== +19: +19: +19: ======================= ROCm System Management Interface ======================= +19: ================================= Concise Info ================================= +19: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +19: 0 47.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 2 40.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 4 39.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 6 40.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: ================================================================================ +19: ============================= End of ROCm SMI Log ============================== +21: +21: +21: ======================= ROCm System Management Interface ======================= +21: ================================= Concise Info ================================= +21: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +21: 0 42.0c 99.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 1 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 2 42.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 4 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 6 41.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: ================================================================================ +21: ============================= End of ROCm SMI Log ============================== +16: +16: +16: ======================= ROCm System Management Interface ======================= +16: ================================= Concise Info ================================= +16: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +16: 0 45.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 2 35.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 4 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 6 39.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: ================================================================================ +16: ============================= End of ROCm SMI Log ============================== +11: +11: +11: ======================= ROCm System Management Interface ======================= +11: ================================= Concise Info ================================= +11: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +11: 0 48.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 2 40.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 5 38.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 6 39.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: ================================================================================ +11: ============================= End of ROCm SMI Log ============================== +29: +29: +29: ======================= ROCm System Management Interface ======================= +29: ================================= Concise Info ================================= +29: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +29: 0 48.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 2 42.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 4 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 6 38.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: ================================================================================ +29: ============================= End of ROCm SMI Log ============================== +13: Launching on nid005464 (13/32), master nid005451 port 9999, GPUs 8, CUDA: True +31: Launching on nid005572 (31/32), master nid005451 port 9999, GPUs 8, CUDA: True +28: Launching on nid005569 (28/32), master nid005451 port 9999, GPUs 8, CUDA: True +16: Launching on nid005557 (16/32), master nid005451 port 9999, GPUs 8, CUDA: True +25: Launching on nid005566 (25/32), master nid005451 port 9999, GPUs 8, CUDA: True +30: Launching on nid005571 (30/32), master nid005451 port 9999, GPUs 8, CUDA: True +20: Launching on nid005561 (20/32), master nid005451 port 9999, GPUs 8, CUDA: True + 9: Launching on nid005460 (9/32), master nid005451 port 9999, GPUs 8, CUDA: True +14: Launching on nid005465 (14/32), master nid005451 port 9999, GPUs 8, CUDA: True +23: Launching on nid005564 (23/32), master nid005451 port 9999, GPUs 8, CUDA: True + 2: Launching on nid005453 (2/32), master nid005451 port 9999, GPUs 8, CUDA: True + 7: Launching on nid005458 (7/32), master nid005451 port 9999, GPUs 8, CUDA: True +22: Launching on nid005563 (22/32), master nid005451 port 9999, GPUs 8, CUDA: True + 4: Launching on nid005455 (4/32), master nid005451 port 9999, GPUs 8, CUDA: True +12: Launching on nid005463 (12/32), master nid005451 port 9999, GPUs 8, CUDA: True + 1: Launching on nid005452 (1/32), master nid005451 port 9999, GPUs 8, CUDA: True +26: Launching on nid005567 (26/32), master nid005451 port 9999, GPUs 8, CUDA: True +27: Launching on nid005568 (27/32), master nid005451 port 9999, GPUs 8, CUDA: True + 5: Launching on nid005456 (5/32), master nid005451 port 9999, GPUs 8, CUDA: True +24: Launching on nid005565 (24/32), master nid005451 port 9999, GPUs 8, CUDA: True + 0: Launching on nid005451 (0/32), master nid005451 port 9999, GPUs 8, CUDA: True +17: Launching on nid005558 (17/32), master nid005451 port 9999, GPUs 8, CUDA: True + 8: Launching on nid005459 (8/32), master nid005451 port 9999, GPUs 8, CUDA: True +18: Launching on nid005559 (18/32), master nid005451 port 9999, GPUs 8, CUDA: True + 6: Launching on nid005457 (6/32), master nid005451 port 9999, GPUs 8, CUDA: True +29: Launching on nid005570 (29/32), master nid005451 port 9999, GPUs 8, CUDA: True +10: Launching on nid005461 (10/32), master nid005451 port 9999, GPUs 8, CUDA: True +11: Launching on nid005462 (11/32), master nid005451 port 9999, GPUs 8, CUDA: True +15: Launching on nid005466 (15/32), master nid005451 port 9999, GPUs 8, CUDA: True +21: Launching on nid005562 (21/32), master nid005451 port 9999, GPUs 8, CUDA: True + 3: Launching on nid005454 (3/32), master nid005451 port 9999, GPUs 8, CUDA: True +19: Launching on nid005560 (19/32), master nid005451 port 9999, GPUs 8, CUDA: True + 0: using world size: 256, data-parallel-size: 128, tensor-model-parallel size: 2, pipeline-model-parallel size: 1 + 0: accumulate and all-reduce gradients in fp32 for bfloat16 data type. + 0: using torch.bfloat16 for parameters ... + 0: ------------------------ arguments ------------------------ + 0: abort_on_unmet_fused_kernel_constraints ......... False + 0: accumulate_allreduce_grads_in_fp32 .............. True + 0: adam_beta1 ...................................... 0.9 + 0: adam_beta2 ...................................... 0.999 + 0: adam_eps ........................................ 1e-08 + 0: adlr_autoresume ................................. False + 0: adlr_autoresume_interval ........................ 1000 + 0: apply_query_key_layer_scaling ................... True + 0: apply_residual_connection_post_layernorm ........ False + 0: attention_dropout ............................... 0.1 + 0: attention_softmax_in_fp32 ....................... False + 0: bert_binary_head ................................ True + 0: bert_load ....................................... None + 0: bf16 ............................................ True + 0: bias_dropout_fusion ............................. True + 0: bias_gelu_fusion ................................ True + 0: biencoder_projection_dim ........................ 0 + 0: biencoder_shared_query_context_model ............ False + 0: block_data_path ................................. None + 0: checkpoint_activations .......................... False + 0: checkpoint_in_cpu ............................... False + 0: checkpoint_num_layers ........................... 1 + 0: clip_grad ....................................... 1.0 + 0: codecarbon_dir .................................. None + 0: consumed_train_samples .......................... 0 + 0: consumed_train_tokens ........................... 0 + 0: consumed_valid_samples .......................... 0 + 0: contigious_checkpointing ........................ False + 0: cpu_optimizer ................................... False + 0: cpu_torch_adam .................................. False + 0: curriculum_learning ............................. False + 0: data_impl ....................................... mmap + 0: data_parallel_size .............................. 128 + 0: data_path ....................................... None + 0: dataloader_type ................................. single + 0: DDP_impl ........................................ local + 0: decoder_seq_length .............................. None + 0: deepscale ....................................... False + 0: deepscale_config ................................ None + 0: deepspeed ....................................... True + 0: deepspeed_activation_checkpointing .............. False + 0: deepspeed_config ................................ ds_configs/3491169.json + 0: deepspeed_mpi ................................... False + 0: distribute_checkpointed_activations ............. False + 0: distributed_backend ............................. nccl + 0: embed_layernorm ................................. False + 0: embedding_path .................................. None + 0: encoder_seq_length .............................. 2048 + 0: eod_mask_loss ................................... False + 0: eval_interval ................................... 1 + 0: eval_iters ...................................... 100 + 0: eval_only ....................................... True + 0: evidence_data_path .............................. None + 0: exit_duration_in_mins ........................... None + 0: exit_interval ................................... None + 0: ffn_hidden_size ................................. 10240 + 0: finetune ........................................ False + 0: fp16 ............................................ False + 0: fp16_lm_cross_entropy ........................... False + 0: fp32_residual_connection ........................ False + 0: gigaflos_no_embeds .............................. 0 + 0: global_batch_size ............................... 1024 + 0: glu_activation .................................. None + 0: hidden_dropout .................................. 0.1 + 0: hidden_size ..................................... 2560 + 0: hysteresis ...................................... 2 + 0: ict_head_size ................................... None + 0: ict_load ........................................ None + 0: img_dim ......................................... 224 + 0: indexer_batch_size .............................. 128 + 0: indexer_log_interval ............................ 1000 + 0: inference ....................................... False + 0: init_method_std ................................. 0.02 + 0: init_method_xavier_uniform ...................... False + 0: initial_loss_scale .............................. 4294967296 + 0: kill_switch_path ................................ kill-switch-4b284b84bperplexity50val + 0: kv_channels ..................................... 128 + 0: layer_norm_fusion ............................... True + 0: layernorm_epsilon ............................... 1e-05 + 0: lazy_mpu_init ................................... None + 0: load ............................................ lm1-4b2-84b-c4-perplexity/perplexity50 + 0: local_rank ...................................... None + 0: log_batch_size_to_tensorboard ................... True + 0: log_interval .................................... 10 + 0: log_learning_rate_to_tensorboard ................ True + 0: log_level ....................................... None + 0: log_level_replica ............................... None + 0: log_loss_scale_to_tensorboard ................... True + 0: log_num_zeros_in_grad ........................... False + 0: log_params_norm ................................. False + 0: log_path ........................................ None + 0: log_timers_to_tensorboard ....................... True + 0: log_validation_ppl_to_tensorboard ............... True + 0: loss_on_targets_only ............................ False + 0: loss_scale ...................................... None + 0: loss_scale_window ............................... 1000 + 0: lr .............................................. 0.0002 + 0: lr_decay_iters .................................. None + 0: lr_decay_samples ................................ 1 + 0: lr_decay_style .................................. cosine + 0: lr_decay_tokens ................................. None + 0: lr_warmup_fraction .............................. None + 0: lr_warmup_iters ................................. 0 + 0: lr_warmup_samples ............................... 0 + 0: make_vocab_size_divisible_by .................... 128 + 0: mask_prob ....................................... 0.15 + 0: masked_softmax_fusion ........................... True + 0: max_position_embeddings ......................... 2048 + 0: mean_noise_span_length .......................... None + 0: memory_centric_tiled_linear ..................... False + 0: merge_file ...................................... gpt2/merges.txt + 0: micro_batch_size ................................ 2 + 0: min_loss_scale .................................. 1.0 + 0: min_lr .......................................... 2e-05 + 0: mmap_warmup ..................................... False + 0: no_load_optim ................................... True + 0: no_load_rng ..................................... None + 0: no_save_optim ................................... None + 0: no_save_rng ..................................... None + 0: noise_density ................................... None + 0: num_attention_heads ............................. 20 + 0: num_channels .................................... 3 + 0: num_classes ..................................... 1000 + 0: num_layers ...................................... 34 + 0: num_layers_per_virtual_pipeline_stage ........... None + 0: num_workers ..................................... 2 + 0: onnx_safe ....................................... None + 0: openai_gelu ..................................... False + 0: optimizer ....................................... adam + 0: optimizer_fusion ................................ True + 0: override_lr_scheduler ........................... True + 0: pad_vocab_size_to ............................... None + 0: params_dtype .................................... torch.bfloat16 + 0: partition_activations ........................... False + 0: patch_dim ....................................... 16 + 0: pipeline_model_parallel_size .................... 1 + 0: position_embedding_type ......................... PositionEmbeddingType.absolute + 0: pp_partition_method ............................. None + 0: profile_backward ................................ False + 0: query_in_block_prob ............................. 0.1 + 0: rampup_batch_size ............................... None + 0: rank ............................................ 0 + 0: remote_device ................................... none + 0: reset_attention_mask ............................ False + 0: reset_position_ids .............................. False + 0: reset_progress .................................. True + 0: retriever_report_topk_accuracies ................ [] + 0: retriever_score_scaling ......................... False + 0: retriever_seq_length ............................ 256 + 0: reweight_loss_based_on_position_frequency ....... False + 0: sample_rate ..................................... 1.0 + 0: save ............................................ lm1-4b2-84b-c4-perplexity/perplexity50 + 0: save_interval ................................... 1000 + 0: scatter_gather_tensors_in_pipeline .............. True + 0: scattered_embeddings ............................ False + 0: seed ............................................ 1234 + 0: seq_length ...................................... 2048 + 0: sgd_momentum .................................... 0.9 + 0: short_seq_prob .................................. 0.1 + 0: skip_train_iteration_range ...................... None + 0: split ........................................... None + 0: split_transformers .............................. False + 0: sync_tp_duplicated_parameters ................... False + 0: synchronize_each_layer .......................... False + 0: tensor_model_parallel_size ...................... 2 + 0: tensorboard_dir ................................. tensorboard_4b284b84bperplexity50val + 0: tensorboard_log_interval ........................ 1 + 0: tensorboard_queue_size .......................... 5 + 0: test_weighted_split_paths ....................... None + 0: test_weighted_split_paths_path .................. None + 0: tile_factor ..................................... 1 + 0: titles_data_path ................................ None + 0: tokenizer_name_or_path .......................... None + 0: tokenizer_type .................................. GPT2BPETokenizer + 0: train_iters ..................................... None + 0: train_samples ................................... 1 + 0: train_tokens .................................... None + 0: train_weighted_split_names ...................... ['train'] + 0: train_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document']] + 0: train_weighted_split_paths_path ................. None + 0: train_weighted_split_splits ..................... [['0:1']] + 0: train_weighted_split_weights .................... [['1.0']] + 0: universal_checkpoint ............................ False + 0: use_bnb_optimizer ............................... False + 0: use_checkpoint_lr_scheduler ..................... False + 0: use_contiguous_buffers_in_ddp ................... True + 0: use_cpu_initialization .......................... None + 0: use_one_sent_docs ............................... False + 0: use_pin_memory .................................. False + 0: valid_num_workers ............................... 2 + 0: valid_weighted_split_names ...................... ['validation'] + 0: valid_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document']] + 0: valid_weighted_split_paths_path ................. None + 0: valid_weighted_split_splits ..................... [['0:1']] + 0: valid_weighted_split_weights .................... [['1.0']] + 0: virtual_pipeline_model_parallel_size ............ None + 0: vocab_extra_ids ................................. 0 + 0: vocab_file ...................................... gpt2/vocab.json + 0: weight_decay .................................... 0.1 + 0: world_size ...................................... 256 + 0: zero_allgather_bucket_size ...................... 0.0 + 0: zero_contigious_gradients ....................... False + 0: zero_reduce_bucket_size ......................... 0.0 + 0: zero_reduce_scatter ............................. False + 0: zero_stage ...................................... 0 + 0: -------------------- end of arguments --------------------- + 0: setting number of micro-batches to constant 4 + 0: > building GPT2BPETokenizer tokenizer ... + 0: > padded vocab (size: 50257) with 175 dummy tokens (new size: 50432) + 0: DeepSpeed general environment info: + 0: torch install path ............... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch'] + 0: torch version .................... 1.13.0+rocm5.2 + 0: torch cuda version ............... None + 0: torch hip version ................ 5.2.21151-afdc89f8 + 0: nvcc version ..................... None + 0: deepspeed install path ........... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/deepspeed'] + 0: deepspeed info ................... 0.7.5, unknown, unknown + 0: deepspeed wheel compiled w. ...... torch 1.13, hip 5.1 + 0: **** Git info for Megatron: git_hash=unknown git_branch=unknown **** + 0: > initializing torch distributed ... + 0: [2023-05-10 12:54:36,630] [INFO] [comm.py:633:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl +31: > setting tensorboard ... + 0: > initializing tensor model parallel with size 2 + 0: > initializing pipeline model parallel with size 1 + 0: > setting random seeds to 1234 ... + 0: > initializing model parallel cuda seeds on global rank 0, model parallel rank 0, and data parallel rank 0 with model parallel seed: 3952 and data parallel seed: 1234 + 0: > compiling dataset index builder ... + 0: make: Entering directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: make: Nothing to be done for 'default'. + 0: make: Leaving directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: >>> done with dataset index builder. Compilation time: 0.100 seconds + 0: > compiling and loading fused kernels ... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 102 + 0: [1/1] c++ scaled_masked_softmax_hip.cuda.o scaled_masked_softmax_hip.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o scaled_masked_softmax_cuda.so + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda_kernel.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_hip_kernel.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 67 + 0: [1/1] c++ layer_norm_hip_kernel.cuda.o layer_norm_cuda.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o fused_mix_prec_layer_norm_cuda.so + 0: >>> done with compiling and loading fused kernels. Compilation time: 23.291 seconds + 0: time to initialize megatron (seconds): -3.512 + 0: [after megatron is initialized] datetime: 2023-05-10 12:55:08 + 0: building GPT model ... + 0: [2023-05-10 12:55:08,658] [INFO] [utils.py:827:see_memory_usage] Before Building Model + 0: [2023-05-10 12:55:08,659] [INFO] [utils.py:828:see_memory_usage] MA 0.0 GB Max_MA 0.0 GB CA 0.0 GB Max_CA 0 GB + 0: [2023-05-10 12:55:08,659] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 37.53 GB, percent = 7.5% + 0: SEED_LAYERS=False BASE_SEED=1234 SEED_FN=None + 0: Using topology: {ProcessCoord(pipe=0, data=0, model=0): 0, ProcessCoord(pipe=0, data=0, model=1): 1, ProcessCoord(pipe=0, data=1, model=0): 2, ProcessCoord(pipe=0, data=1, model=1): 3, ProcessCoord(pipe=0, data=2, model=0): 4, ProcessCoord(pipe=0, data=2, model=1): 5, ProcessCoord(pipe=0, data=3, model=0): 6, ProcessCoord(pipe=0, data=3, model=1): 7, ProcessCoord(pipe=0, data=4, model=0): 8, ProcessCoord(pipe=0, data=4, model=1): 9, ProcessCoord(pipe=0, data=5, model=0): 10, ProcessCoord(pipe=0, data=5, model=1): 11, ProcessCoord(pipe=0, data=6, model=0): 12, ProcessCoord(pipe=0, data=6, model=1): 13, ProcessCoord(pipe=0, data=7, model=0): 14, ProcessCoord(pipe=0, data=7, model=1): 15, ProcessCoord(pipe=0, data=8, model=0): 16, ProcessCoord(pipe=0, data=8, model=1): 17, ProcessCoord(pipe=0, data=9, model=0): 18, ProcessCoord(pipe=0, data=9, model=1): 19, ProcessCoord(pipe=0, data=10, model=0): 20, ProcessCoord(pipe=0, data=10, model=1): 21, ProcessCoord(pipe=0, data=11, model=0): 22, ProcessCoord(pipe=0, data + 0: =11, model=1): 23, ProcessCoord(pipe=0, data=12, model=0): 24, ProcessCoord(pipe=0, data=12, model=1): 25, ProcessCoord(pipe=0, data=13, model=0): 26, ProcessCoord(pipe=0, data=13, model=1): 27, ProcessCoord(pipe=0, data=14, model=0): 28, ProcessCoord(pipe=0, data=14, model=1): 29, ProcessCoord(pipe=0, data=15, model=0): 30, ProcessCoord(pipe=0, data=15, model=1): 31, ProcessCoord(pipe=0, data=16, model=0): 32, ProcessCoord(pipe=0, data=16, model=1): 33, ProcessCoord(pipe=0, data=17, model=0): 34, ProcessCoord(pipe=0, data=17, model=1): 35, ProcessCoord(pipe=0, data=18, model=0): 36, ProcessCoord(pipe=0, data=18, model=1): 37, ProcessCoord(pipe=0, data=19, model=0): 38, ProcessCoord(pipe=0, data=19, model=1): 39, ProcessCoord(pipe=0, data=20, model=0): 40, ProcessCoord(pipe=0, data=20, model=1): 41, ProcessCoord(pipe=0, data=21, model=0): 42, ProcessCoord(pipe=0, data=21, model=1): 43, ProcessCoord(pipe=0, data=22, model=0): 44, ProcessCoord(pipe=0, data=22, model=1): 45, ProcessCoord(pipe=0, data=23, model=0 + 0: ): 46, ProcessCoord(pipe=0, data=23, model=1): 47, ProcessCoord(pipe=0, data=24, model=0): 48, ProcessCoord(pipe=0, data=24, model=1): 49, ProcessCoord(pipe=0, data=25, model=0): 50, ProcessCoord(pipe=0, data=25, model=1): 51, ProcessCoord(pipe=0, data=26, model=0): 52, ProcessCoord(pipe=0, data=26, model=1): 53, ProcessCoord(pipe=0, data=27, model=0): 54, ProcessCoord(pipe=0, data=27, model=1): 55, ProcessCoord(pipe=0, data=28, model=0): 56, ProcessCoord(pipe=0, data=28, model=1): 57, ProcessCoord(pipe=0, data=29, model=0): 58, ProcessCoord(pipe=0, data=29, model=1): 59, ProcessCoord(pipe=0, data=30, model=0): 60, ProcessCoord(pipe=0, data=30, model=1): 61, ProcessCoord(pipe=0, data=31, model=0): 62, ProcessCoord(pipe=0, data=31, model=1): 63, ProcessCoord(pipe=0, data=32, model=0): 64, ProcessCoord(pipe=0, data=32, model=1): 65, ProcessCoord(pipe=0, data=33, model=0): 66, ProcessCoord(pipe=0, data=33, model=1): 67, ProcessCoord(pipe=0, data=34, model=0): 68, ProcessCoord(pipe=0, data=34, model=1): 69, Proce + 0: ssCoord(pipe=0, data=35, model=0): 70, ProcessCoord(pipe=0, data=35, model=1): 71, ProcessCoord(pipe=0, data=36, model=0): 72, ProcessCoord(pipe=0, data=36, model=1): 73, ProcessCoord(pipe=0, data=37, model=0): 74, ProcessCoord(pipe=0, data=37, model=1): 75, ProcessCoord(pipe=0, data=38, model=0): 76, ProcessCoord(pipe=0, data=38, model=1): 77, ProcessCoord(pipe=0, data=39, model=0): 78, ProcessCoord(pipe=0, data=39, model=1): 79, ProcessCoord(pipe=0, data=40, model=0): 80, ProcessCoord(pipe=0, data=40, model=1): 81, ProcessCoord(pipe=0, data=41, model=0): 82, ProcessCoord(pipe=0, data=41, model=1): 83, ProcessCoord(pipe=0, data=42, model=0): 84, ProcessCoord(pipe=0, data=42, model=1): 85, ProcessCoord(pipe=0, data=43, model=0): 86, ProcessCoord(pipe=0, data=43, model=1): 87, ProcessCoord(pipe=0, data=44, model=0): 88, ProcessCoord(pipe=0, data=44, model=1): 89, ProcessCoord(pipe=0, data=45, model=0): 90, ProcessCoord(pipe=0, data=45, model=1): 91, ProcessCoord(pipe=0, data=46, model=0): 92, ProcessCoord(pipe + 0: =0, data=46, model=1): 93, ProcessCoord(pipe=0, data=47, model=0): 94, ProcessCoord(pipe=0, data=47, model=1): 95, ProcessCoord(pipe=0, data=48, model=0): 96, ProcessCoord(pipe=0, data=48, model=1): 97, ProcessCoord(pipe=0, data=49, model=0): 98, ProcessCoord(pipe=0, data=49, model=1): 99, ProcessCoord(pipe=0, data=50, model=0): 100, ProcessCoord(pipe=0, data=50, model=1): 101, ProcessCoord(pipe=0, data=51, model=0): 102, ProcessCoord(pipe=0, data=51, model=1): 103, ProcessCoord(pipe=0, data=52, model=0): 104, ProcessCoord(pipe=0, data=52, model=1): 105, ProcessCoord(pipe=0, data=53, model=0): 106, ProcessCoord(pipe=0, data=53, model=1): 107, ProcessCoord(pipe=0, data=54, model=0): 108, ProcessCoord(pipe=0, data=54, model=1): 109, ProcessCoord(pipe=0, data=55, model=0): 110, ProcessCoord(pipe=0, data=55, model=1): 111, ProcessCoord(pipe=0, data=56, model=0): 112, ProcessCoord(pipe=0, data=56, model=1): 113, ProcessCoord(pipe=0, data=57, model=0): 114, ProcessCoord(pipe=0, data=57, model=1): 115, ProcessCoord( + 0: pipe=0, data=58, model=0): 116, ProcessCoord(pipe=0, data=58, model=1): 117, ProcessCoord(pipe=0, data=59, model=0): 118, ProcessCoord(pipe=0, data=59, model=1): 119, ProcessCoord(pipe=0, data=60, model=0): 120, ProcessCoord(pipe=0, data=60, model=1): 121, ProcessCoord(pipe=0, data=61, model=0): 122, ProcessCoord(pipe=0, data=61, model=1): 123, ProcessCoord(pipe=0, data=62, model=0): 124, ProcessCoord(pipe=0, data=62, model=1): 125, ProcessCoord(pipe=0, data=63, model=0): 126, ProcessCoord(pipe=0, data=63, model=1): 127, ProcessCoord(pipe=0, data=64, model=0): 128, ProcessCoord(pipe=0, data=64, model=1): 129, ProcessCoord(pipe=0, data=65, model=0): 130, ProcessCoord(pipe=0, data=65, model=1): 131, ProcessCoord(pipe=0, data=66, model=0): 132, ProcessCoord(pipe=0, data=66, model=1): 133, ProcessCoord(pipe=0, data=67, model=0): 134, ProcessCoord(pipe=0, data=67, model=1): 135, ProcessCoord(pipe=0, data=68, model=0): 136, ProcessCoord(pipe=0, data=68, model=1): 137, ProcessCoord(pipe=0, data=69, model=0): 138, Pr + 0: ocessCoord(pipe=0, data=69, model=1): 139, ProcessCoord(pipe=0, data=70, model=0): 140, ProcessCoord(pipe=0, data=70, model=1): 141, ProcessCoord(pipe=0, data=71, model=0): 142, ProcessCoord(pipe=0, data=71, model=1): 143, ProcessCoord(pipe=0, data=72, model=0): 144, ProcessCoord(pipe=0, data=72, model=1): 145, ProcessCoord(pipe=0, data=73, model=0): 146, ProcessCoord(pipe=0, data=73, model=1): 147, ProcessCoord(pipe=0, data=74, model=0): 148, ProcessCoord(pipe=0, data=74, model=1): 149, ProcessCoord(pipe=0, data=75, model=0): 150, ProcessCoord(pipe=0, data=75, model=1): 151, ProcessCoord(pipe=0, data=76, model=0): 152, ProcessCoord(pipe=0, data=76, model=1): 153, ProcessCoord(pipe=0, data=77, model=0): 154, ProcessCoord(pipe=0, data=77, model=1): 155, ProcessCoord(pipe=0, data=78, model=0): 156, ProcessCoord(pipe=0, data=78, model=1): 157, ProcessCoord(pipe=0, data=79, model=0): 158, ProcessCoord(pipe=0, data=79, model=1): 159, ProcessCoord(pipe=0, data=80, model=0): 160, ProcessCoord(pipe=0, data=80, model= + 0: 1): 161, ProcessCoord(pipe=0, data=81, model=0): 162, ProcessCoord(pipe=0, data=81, model=1): 163, ProcessCoord(pipe=0, data=82, model=0): 164, ProcessCoord(pipe=0, data=82, model=1): 165, ProcessCoord(pipe=0, data=83, model=0): 166, ProcessCoord(pipe=0, data=83, model=1): 167, ProcessCoord(pipe=0, data=84, model=0): 168, ProcessCoord(pipe=0, data=84, model=1): 169, ProcessCoord(pipe=0, data=85, model=0): 170, ProcessCoord(pipe=0, data=85, model=1): 171, ProcessCoord(pipe=0, data=86, model=0): 172, ProcessCoord(pipe=0, data=86, model=1): 173, ProcessCoord(pipe=0, data=87, model=0): 174, ProcessCoord(pipe=0, data=87, model=1): 175, ProcessCoord(pipe=0, data=88, model=0): 176, ProcessCoord(pipe=0, data=88, model=1): 177, ProcessCoord(pipe=0, data=89, model=0): 178, ProcessCoord(pipe=0, data=89, model=1): 179, ProcessCoord(pipe=0, data=90, model=0): 180, ProcessCoord(pipe=0, data=90, model=1): 181, ProcessCoord(pipe=0, data=91, model=0): 182, ProcessCoord(pipe=0, data=91, model=1): 183, ProcessCoord(pipe=0, data + 0: =92, model=0): 184, ProcessCoord(pipe=0, data=92, model=1): 185, ProcessCoord(pipe=0, data=93, model=0): 186, ProcessCoord(pipe=0, data=93, model=1): 187, ProcessCoord(pipe=0, data=94, model=0): 188, ProcessCoord(pipe=0, data=94, model=1): 189, ProcessCoord(pipe=0, data=95, model=0): 190, ProcessCoord(pipe=0, data=95, model=1): 191, ProcessCoord(pipe=0, data=96, model=0): 192, ProcessCoord(pipe=0, data=96, model=1): 193, ProcessCoord(pipe=0, data=97, model=0): 194, ProcessCoord(pipe=0, data=97, model=1): 195, ProcessCoord(pipe=0, data=98, model=0): 196, ProcessCoord(pipe=0, data=98, model=1): 197, ProcessCoord(pipe=0, data=99, model=0): 198, ProcessCoord(pipe=0, data=99, model=1): 199, ProcessCoord(pipe=0, data=100, model=0): 200, ProcessCoord(pipe=0, data=100, model=1): 201, ProcessCoord(pipe=0, data=101, model=0): 202, ProcessCoord(pipe=0, data=101, model=1): 203, ProcessCoord(pipe=0, data=102, model=0): 204, ProcessCoord(pipe=0, data=102, model=1): 205, ProcessCoord(pipe=0, data=103, model=0): 206, Process + 0: Coord(pipe=0, data=103, model=1): 207, ProcessCoord(pipe=0, data=104, model=0): 208, ProcessCoord(pipe=0, data=104, model=1): 209, ProcessCoord(pipe=0, data=105, model=0): 210, ProcessCoord(pipe=0, data=105, model=1): 211, ProcessCoord(pipe=0, data=106, model=0): 212, ProcessCoord(pipe=0, data=106, model=1): 213, ProcessCoord(pipe=0, data=107, model=0): 214, ProcessCoord(pipe=0, data=107, model=1): 215, ProcessCoord(pipe=0, data=108, model=0): 216, ProcessCoord(pipe=0, data=108, model=1): 217, ProcessCoord(pipe=0, data=109, model=0): 218, ProcessCoord(pipe=0, data=109, model=1): 219, ProcessCoord(pipe=0, data=110, model=0): 220, ProcessCoord(pipe=0, data=110, model=1): 221, ProcessCoord(pipe=0, data=111, model=0): 222, ProcessCoord(pipe=0, data=111, model=1): 223, ProcessCoord(pipe=0, data=112, model=0): 224, ProcessCoord(pipe=0, data=112, model=1): 225, ProcessCoord(pipe=0, data=113, model=0): 226, ProcessCoord(pipe=0, data=113, model=1): 227, ProcessCoord(pipe=0, data=114, model=0): 228, ProcessCoord(pipe=0 + 0: , data=114, model=1): 229, ProcessCoord(pipe=0, data=115, model=0): 230, ProcessCoord(pipe=0, data=115, model=1): 231, ProcessCoord(pipe=0, data=116, model=0): 232, ProcessCoord(pipe=0, data=116, model=1): 233, ProcessCoord(pipe=0, data=117, model=0): 234, ProcessCoord(pipe=0, data=117, model=1): 235, ProcessCoord(pipe=0, data=118, model=0): 236, ProcessCoord(pipe=0, data=118, model=1): 237, ProcessCoord(pipe=0, data=119, model=0): 238, ProcessCoord(pipe=0, data=119, model=1): 239, ProcessCoord(pipe=0, data=120, model=0): 240, ProcessCoord(pipe=0, data=120, model=1): 241, ProcessCoord(pipe=0, data=121, model=0): 242, ProcessCoord(pipe=0, data=121, model=1): 243, ProcessCoord(pipe=0, data=122, model=0): 244, ProcessCoord(pipe=0, data=122, model=1): 245, ProcessCoord(pipe=0, data=123, model=0): 246, ProcessCoord(pipe=0, data=123, model=1): 247, ProcessCoord(pipe=0, data=124, model=0): 248, ProcessCoord(pipe=0, data=124, model=1): 249, ProcessCoord(pipe=0, data=125, model=0): 250, ProcessCoord(pipe=0, data=125, + 0: model=1): 251, ProcessCoord(pipe=0, data=126, model=0): 252, ProcessCoord(pipe=0, data=126, model=1): 253, ProcessCoord(pipe=0, data=127, model=0): 254, ProcessCoord(pipe=0, data=127, model=1): 255} + 0: [2023-05-10 12:55:14,142] [INFO] [module.py:366:_partition_layers] Partitioning pipeline stages with method type:transformer + 0: stage=0 layers=41 + 0: 0: _to_float16 + 0: 1: EmbeddingPipe + 0: 2: + 0: 3: ParallelTransformerLayerPipe + 0: 4: ParallelTransformerLayerPipe + 0: 5: ParallelTransformerLayerPipe + 0: 6: ParallelTransformerLayerPipe + 0: 7: ParallelTransformerLayerPipe + 0: 8: ParallelTransformerLayerPipe + 0: 9: ParallelTransformerLayerPipe + 0: 10: ParallelTransformerLayerPipe + 0: 11: ParallelTransformerLayerPipe + 0: 12: ParallelTransformerLayerPipe + 0: 13: ParallelTransformerLayerPipe + 0: 14: ParallelTransformerLayerPipe + 0: 15: ParallelTransformerLayerPipe + 0: 16: ParallelTransformerLayerPipe + 0: 17: ParallelTransformerLayerPipe + 0: 18: ParallelTransformerLayerPipe + 0: 19: ParallelTransformerLayerPipe + 0: 20: ParallelTransformerLayerPipe + 0: 21: ParallelTransformerLayerPipe + 0: 22: ParallelTransformerLayerPipe + 0: 23: ParallelTransformerLayerPipe + 0: 24: ParallelTransformerLayerPipe + 0: 25: ParallelTransformerLayerPipe + 0: 26: ParallelTransformerLayerPipe + 0: 27: ParallelTransformerLayerPipe + 0: 28: ParallelTransformerLayerPipe + 0: 29: ParallelTransformerLayerPipe + 0: 30: ParallelTransformerLayerPipe + 0: 31: ParallelTransformerLayerPipe + 0: 32: ParallelTransformerLayerPipe + 0: 33: ParallelTransformerLayerPipe + 0: 34: ParallelTransformerLayerPipe + 0: 35: ParallelTransformerLayerPipe + 0: 36: ParallelTransformerLayerPipe + 0: 37: undo + 0: 38: MixedFusedLayerNorm + 0: 39: EmbeddingPipe + 0: 40: float16_to_fp32 + 0: loss: CrossEntropy + 0: [2023-05-10 12:55:14,739] [INFO] [utils.py:827:see_memory_usage] After Building Model + 0: [2023-05-10 12:55:14,740] [INFO] [utils.py:828:see_memory_usage] MA 2.7 GB Max_MA 2.7 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:55:14,740] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 37.72 GB, percent = 7.5% + 0: setting training iterations to 0 + 0: > learning rate decay style: cosine + 0: DeepSpeed is enabled. + 0: [2023-05-10 12:55:14,743] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed info: version=0.7.5, git-hash=unknown, git-branch=unknown + 0: [2023-05-10 12:55:20,573] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Flops Profiler Enabled: False + 0: [2023-05-10 12:55:20,573] [INFO] [logging.py:68:log_dist] [Rank 0] Removing param_group that has no 'params' in the client Optimizer + 0: [2023-05-10 12:55:20,573] [INFO] [logging.py:68:log_dist] [Rank 0] Using client Optimizer as basic optimizer + 0: [2023-05-10 12:55:20,593] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Basic Optimizer = FusedAdam + 0: [2023-05-10 12:55:20,593] [INFO] [logging.py:68:log_dist] [Rank 0] Creating BF16 optimizer + 0: [2023-05-10 12:55:20,729] [INFO] [utils.py:827:see_memory_usage] begin bf16_optimizer + 0: [2023-05-10 12:55:20,729] [INFO] [utils.py:828:see_memory_usage] MA 2.69 GB Max_MA 2.71 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:55:20,729] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.38 GB, percent = 7.6% + 4: Time to load utils op: 0.30145931243896484 secondsTime to load utils op: 0.3014988899230957 seconds + 4: Time to load utils op: 0.3006296157836914 seconds + 4: Time to load utils op: 0.30058765411376953 seconds + 4: + 5: Time to load utils op: 0.3024766445159912 secondsTime to load utils op: 0.30239200592041016 seconds + 5: Time to load utils op: 0.3029210567474365 seconds + 5: + 5: Time to load utils op: 0.30289745330810547 seconds + 3: Time to load utils op: 0.3034954071044922 secondsTime to load utils op: 0.30350327491760254 seconds + 3: + 3: Time to load utils op: 0.30420446395874023 seconds + 3: Time to load utils op: 0.30286598205566406 seconds + 2: Time to load utils op: 0.3002138137817383 seconds + 2: Time to load utils op: 0.30022644996643066 secondsTime to load utils op: 0.30022692680358887 seconds + 2: + 2: Time to load utils op: 0.3002316951751709 seconds +19: Time to load utils op: 0.29546523094177246 secondsTime to load utils op: 0.2953300476074219 seconds +19: +19: Time to load utils op: 0.29543447494506836 secondsTime to load utils op: 0.2958817481994629 seconds +19: + 1: Time to load utils op: 0.302351713180542 secondsTime to load utils op: 0.30234766006469727 secondsTime to load utils op: 0.30236268043518066 seconds + 1: + 1: + 1: Time to load utils op: 0.3023815155029297 seconds + 9: Time to load utils op: 0.30022287368774414 seconds + 9: Time to load utils op: 0.30156731605529785 seconds + 9: Time to load utils op: 0.3020365238189697 seconds + 9: Time to load utils op: 0.30315518379211426 seconds + 0: Time to load utils op: 0.18796777725219727 secondsTime to load utils op: 0.30727434158325195 seconds + 0: + 0: Time to load utils op: 0.30700206756591797 seconds + 0: Time to load utils op: 0.307417631149292 seconds +11: Time to load utils op: 0.29810261726379395 secondsTime to load utils op: 0.29810333251953125 seconds +11: +11: Time to load utils op: 0.29811739921569824 seconds +11: Time to load utils op: 0.2981297969818115 seconds +14: Time to load utils op: 0.30480504035949707 secondsTime to load utils op: 0.30476903915405273 seconds +14: +14: Time to load utils op: 0.30533432960510254 seconds +14: Time to load utils op: 0.30580687522888184 seconds +20: Time to load utils op: 0.3025376796722412 seconds +20: Time to load utils op: 0.3009603023529053 seconds +20: Time to load utils op: 0.30200862884521484 seconds +20: Time to load utils op: 0.3019137382507324 seconds +25: Time to load utils op: 0.2944059371948242 seconds +31: Time to load utils op: 0.29152774810791016 seconds +31: Time to load utils op: 0.2915363311767578 secondsTime to load utils op: 0.29154539108276367 seconds +31: +25: Time to load utils op: 0.29442930221557617 seconds +25: Time to load utils op: 0.29443812370300293 seconds +25: Time to load utils op: 0.2944362163543701 seconds +31: Time to load utils op: 0.29156994819641113 seconds +24: Time to load utils op: 0.29549193382263184 seconds +24: Time to load utils op: 0.2954995632171631 seconds +24: Time to load utils op: 0.2955038547515869 secondsTime to load utils op: 0.2955174446105957 seconds +27: Time to load utils op: 0.29775547981262207 seconds +17: Time to load utils op: 0.2998337745666504 seconds +17: Time to load utils op: 0.29984498023986816 seconds +17: Time to load utils op: 0.29985475540161133 seconds +17: Time to load utils op: 0.2998692989349365 seconds +24: +27: Time to load utils op: 0.29845452308654785 secondsTime to load utils op: 0.2986781597137451 seconds +27: +28: Time to load utils op: 0.2985243797302246 secondsTime to load utils op: 0.2980082035064697 seconds +28: +28: Time to load utils op: 0.29687023162841797 seconds +28: Time to load utils op: 0.2984166145324707 seconds +27: Time to load utils op: 0.2985522747039795 seconds +29: Time to load utils op: 0.2936868667602539 seconds +29: Time to load utils op: 0.2936995029449463 seconds +29: Time to load utils op: 0.29369688034057617 seconds +29: Time to load utils op: 0.2937142848968506 seconds +30: Time to load utils op: 0.29292845726013184 seconds +30: Time to load utils op: 0.2929401397705078 seconds +30: Time to load utils op: 0.2929563522338867 secondsTime to load utils op: 0.29290127754211426 seconds +30: +13: Time to load utils op: 0.3029956817626953 secondsTime to load utils op: 0.3029961585998535 seconds +13: +13: Time to load utils op: 0.30299830436706543 seconds +13: Time to load utils op: 0.3030250072479248 seconds + 8: Time to load utils op: 0.3065776824951172 seconds + 8: Time to load utils op: 0.3065938949584961 seconds + 8: Time to load utils op: 0.30659961700439453 seconds + 8: Time to load utils op: 0.30663490295410156 seconds +18: Time to load utils op: 0.3005490303039551 secondsTime to load utils op: 0.3005561828613281 seconds +18: +18: Time to load utils op: 0.3005664348602295 seconds +18: Time to load utils op: 0.30057358741760254 seconds +10: Time to load utils op: 0.3059351444244385 secondsTime to load utils op: 0.30594468116760254 seconds +10: +10: Time to load utils op: 0.30596232414245605 seconds +10: Time to load utils op: 0.30595874786376953 seconds +15: Time to load utils op: 0.30394840240478516 secondsTime to load utils op: 0.30395078659057617 seconds +15: +15: Time to load utils op: 0.3039681911468506 seconds +15: Time to load utils op: 0.3039863109588623 seconds +12: Time to load utils op: 0.30553436279296875 seconds +12: Time to load utils op: 0.30555009841918945 seconds +12: Time to load utils op: 0.305556058883667 seconds +26: Time to load utils op: 0.30157923698425293 seconds +26: Time to load utils op: 0.301624059677124 seconds +26: Time to load utils op: 0.30135226249694824 seconds +12: Time to load utils op: 0.30556511878967285 seconds +26: Time to load utils op: 0.30205678939819336 seconds +16: Time to load utils op: 0.3031961917877197 seconds +16: Time to load utils op: 0.30321335792541504 seconds +16: Time to load utils op: 0.3032209873199463 seconds + 7: Time to load utils op: 0.3086254596710205 seconds + 7: Time to load utils op: 0.30863094329833984 secondsTime to load utils op: 0.3086264133453369 seconds + 7: +21: Time to load utils op: 0.3010554313659668 secondsTime to load utils op: 0.3010556697845459 seconds +21: +16: Time to load utils op: 0.30323171615600586 seconds + 7: Time to load utils op: 0.30869412422180176 seconds +21: Time to load utils op: 0.30109214782714844 seconds +21: Time to load utils op: 0.3011043071746826 seconds + 6: Time to load utils op: 0.308011531829834 seconds + 6: Time to load utils op: 0.3080329895019531 seconds + 6: Time to load utils op: 0.3080418109893799 seconds +23: Time to load utils op: 0.30333900451660156 secondsTime to load utils op: 0.30338549613952637 seconds +23: +23: Time to load utils op: 0.3031649589538574 seconds + 6: Time to load utils op: 0.30805158615112305 seconds +23: Time to load utils op: 0.30292797088623047 seconds +22: Time to load utils op: 0.30371952056884766 seconds +22: Time to load utils op: 0.30496811866760254 seconds +22: Time to load utils op: 0.3051128387451172 secondsTime to load utils op: 0.30493831634521484 seconds +22: + 0: [2023-05-10 12:55:21,040] [INFO] [utils.py:827:see_memory_usage] before initializing group 0 + 0: [2023-05-10 12:55:21,041] [INFO] [utils.py:828:see_memory_usage] MA 2.69 GB Max_MA 2.69 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:55:21,041] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.38 GB, percent = 7.6% + 4: Time to load utils op: 0.0010786056518554688 secondsTime to load utils op: 0.001100778579711914 seconds + 4: + 4: Time to load utils op: 0.0010945796966552734 seconds + 4: Time to load utils op: 0.0011260509490966797 seconds +19: Time to load utils op: 0.0010292530059814453 secondsTime to load utils op: 0.0009734630584716797 seconds +19: Time to load utils op: 0.0010287761688232422 seconds +19: +19: Time to load utils op: 0.001081705093383789 seconds + 3: Time to load utils op: 0.001024007797241211 seconds + 3: Time to load utils op: 0.0010097026824951172 seconds + 3: Time to load utils op: 0.000957489013671875 seconds + 3: Time to load utils op: 0.001039743423461914 seconds +25: Time to load utils op: 0.0008246898651123047 seconds +25: Time to load utils op: 0.0006601810455322266 seconds +25: Time to load utils op: 0.0007340908050537109 seconds +25: Time to load utils op: 0.0007321834564208984 seconds +22: Time to load utils op: 0.0005311965942382812 seconds +22: Time to load utils op: 0.0005245208740234375 seconds +22: Time to load utils op: 0.0005466938018798828 seconds +22: Time to load utils op: 0.0005719661712646484 seconds +29: Time to load utils op: 0.0009784698486328125 secondsTime to load utils op: 0.0009737014770507812 seconds +29: +29: Time to load utils op: 0.0009844303131103516 seconds +27: Time to load utils op: 0.0007627010345458984 seconds +29: Time to load utils op: 0.000982046127319336 seconds +27: Time to load utils op: 0.0009255409240722656 secondsTime to load utils op: 0.0009558200836181641 seconds +27: +27: Time to load utils op: 0.001027822494506836 seconds +14: Time to load utils op: 0.001018524169921875 seconds +14: Time to load utils op: 0.0009980201721191406 seconds +14: Time to load utils op: 0.0010066032409667969 seconds +14: Time to load utils op: 0.0010678768157958984 seconds + 9: Time to load utils op: 0.0005142688751220703 seconds + 9: Time to load utils op: 0.0004870891571044922 seconds + 9: Time to load utils op: 0.0005326271057128906 secondsTime to load utils op: 0.0005350112915039062 seconds + 9: + 8: Time to load utils op: 0.0008647441864013672 seconds + 8: Time to load utils op: 0.0009894371032714844 secondsTime to load utils op: 0.000985860824584961 seconds + 8: + 8: Time to load utils op: 0.0010838508605957031 seconds + 0: Time to load utils op: 0.0007927417755126953 seconds + 0: Time to load utils op: 0.0007815361022949219 seconds + 0: Time to load utils op: 0.0007953643798828125 seconds + 1: Time to load utils op: 0.0008082389831542969 seconds + 1: Time to load utils op: 0.0008945465087890625 secondsTime to load utils op: 0.0008742809295654297 seconds + 1: +20: Time to load utils op: 0.0008640289306640625 secondsTime to load utils op: 0.0009043216705322266 seconds +20: +20: Time to load utils op: 0.0008900165557861328 seconds + 1: Time to load utils op: 0.0009243488311767578 seconds +20: Time to load utils op: 0.0008928775787353516 seconds +16: Time to load utils op: 0.0008678436279296875 seconds +16: Time to load utils op: 0.0008797645568847656 seconds +16: Time to load utils op: 0.0008690357208251953 seconds +16: Time to load utils op: 0.0009152889251708984 seconds +11: Time to load utils op: 0.0009477138519287109 secondsTime to load utils op: 0.00091552734375 seconds +11: +11: Time to load utils op: 0.0009238719940185547 seconds +11: Time to load utils op: 0.0009822845458984375 seconds +31: Time to load utils op: 0.0009024143218994141 seconds +31: Time to load utils op: 0.0009067058563232422 seconds +31: Time to load utils op: 0.0009336471557617188 seconds +31: Time to load utils op: 0.0009317398071289062 seconds + 7: Time to load utils op: 0.0008780956268310547 secondsTime to load utils op: 0.0008895397186279297 seconds + 7: + 7: Time to load utils op: 0.0008726119995117188 seconds + 7: Time to load utils op: 0.0009255409240722656 seconds +18: Time to load utils op: 0.0007832050323486328 seconds +18: Time to load utils op: 0.0007815361022949219 seconds +18: Time to load utils op: 0.0008835792541503906 seconds +18: Time to load utils op: 0.0009310245513916016 seconds + 2: Time to load utils op: 0.0008482933044433594 secondsTime to load utils op: 0.0008733272552490234 secondsTime to load utils op: 0.0008440017700195312 seconds + 2: + 2: + 2: Time to load utils op: 0.0008103847503662109 seconds +23: Time to load utils op: 0.0008227825164794922 seconds +23: Time to load utils op: 0.0009241104125976562 seconds +23: Time to load utils op: 0.0008943080902099609 seconds +23: Time to load utils op: 0.000989675521850586 seconds + 5: Time to load utils op: 0.0006949901580810547 seconds + 5: Time to load utils op: 0.0007505416870117188 seconds + 5: Time to load utils op: 0.0008399486541748047 seconds + 5: Time to load utils op: 0.0009169578552246094 seconds +15: Time to load utils op: 0.0007219314575195312 seconds +15: Time to load utils op: 0.0009205341339111328 seconds +15: Time to load utils op: 0.0009131431579589844 seconds +15: Time to load utils op: 0.0009415149688720703 seconds +12: Time to load utils op: 0.0010554790496826172 secondsTime to load utils op: 0.0010275840759277344 seconds +12: +12: Time to load utils op: 0.0010449886322021484 seconds +12: Time to load utils op: 0.0011088848114013672 seconds +28: Time to load utils op: 0.0009322166442871094 seconds +28: Time to load utils op: 0.0008802413940429688 secondsTime to load utils op: 0.0009300708770751953 seconds +28: +28: Time to load utils op: 0.0009796619415283203 seconds +24: Time to load utils op: 0.0007317066192626953 seconds +24: Time to load utils op: 0.0009090900421142578 seconds +24: Time to load utils op: 0.0009200572967529297 seconds +24: Time to load utils op: 0.0009918212890625 seconds +21: Time to load utils op: 0.000797271728515625 seconds +21: Time to load utils op: 0.0007917881011962891 seconds +21: Time to load utils op: 0.0008502006530761719 seconds +21: Time to load utils op: 0.0009002685546875 seconds + 6: Time to load utils op: 0.0007431507110595703 seconds + 6: Time to load utils op: 0.0007777214050292969 seconds + 6: Time to load utils op: 0.0007417201995849609 seconds +10: Time to load utils op: 0.0006470680236816406 seconds +10: Time to load utils op: 0.0005986690521240234 seconds + 6: Time to load utils op: 0.0009975433349609375 seconds +10: Time to load utils op: 0.0006983280181884766 seconds +10: Time to load utils op: 0.0007867813110351562 seconds +13: Time to load utils op: 0.0007491111755371094 seconds +13: Time to load utils op: 0.0007846355438232422 seconds +13: Time to load utils op: 0.0008141994476318359 seconds +13: Time to load utils op: 0.0008654594421386719 seconds +17: Time to load utils op: 0.0007381439208984375 seconds +30: Time to load utils op: 0.0008916854858398438 secondsTime to load utils op: 0.0008611679077148438 seconds +30: +30: Time to load utils op: 0.0008394718170166016 seconds +30: Time to load utils op: 0.0009808540344238281 seconds +17: Time to load utils op: 0.000985860824584961 secondsTime to load utils op: 0.0009174346923828125 seconds +17: +17: Time to load utils op: 0.0009899139404296875 seconds + 0: [2023-05-10 12:55:21,236] [INFO] [utils.py:827:see_memory_usage] after initializing group 0 + 0: [2023-05-10 12:55:21,237] [INFO] [utils.py:828:see_memory_usage] MA 5.38 GB Max_MA 5.38 GB CA 6.82 GB Max_CA 7 GB + 0: [2023-05-10 12:55:21,237] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.45 GB, percent = 7.6% +26: Time to load utils op: 0.0008144378662109375 seconds +26: Time to load utils op: 0.0009195804595947266 secondsTime to load utils op: 0.0008640289306640625 seconds +26: +26: Time to load utils op: 0.0008141994476318359 seconds + 0: [2023-05-10 12:55:21,362] [INFO] [utils.py:827:see_memory_usage] before initializing group 1 + 0: [2023-05-10 12:55:21,362] [INFO] [utils.py:828:see_memory_usage] MA 5.38 GB Max_MA 5.38 GB CA 6.82 GB Max_CA 7 GB + 0: [2023-05-10 12:55:21,362] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.5 GB, percent = 7.7% + 0: [2023-05-10 12:55:21,491] [INFO] [utils.py:827:see_memory_usage] after initializing group 1 + 0: [2023-05-10 12:55:21,491] [INFO] [utils.py:828:see_memory_usage] MA 7.9 GB Max_MA 7.9 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,492] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.55 GB, percent = 7.7% + 0: [2023-05-10 12:55:21,614] [INFO] [utils.py:827:see_memory_usage] before initializing group 2 + 0: [2023-05-10 12:55:21,615] [INFO] [utils.py:828:see_memory_usage] MA 7.9 GB Max_MA 7.9 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,615] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.61 GB, percent = 7.7% + 0: [2023-05-10 12:55:21,740] [INFO] [utils.py:827:see_memory_usage] after initializing group 2 + 0: [2023-05-10 12:55:21,741] [INFO] [utils.py:828:see_memory_usage] MA 7.91 GB Max_MA 7.91 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,741] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.67 GB, percent = 7.7% + 0: Time to load utils op: 0.3110945224761963 seconds + 0: Time to load utils op: 0.31752800941467285 seconds + 0: Time to load utils op: 0.3236064910888672 seconds + 4: Time to load utils op: 0.3227880001068115 seconds + 3: Time to load utils op: 0.32462000846862793 seconds + 3: Time to load utils op: 0.32535362243652344 secondsTime to load utils op: 0.32504844665527344 seconds + 3: + 3: Time to load utils op: 0.3252444267272949 seconds + 0: Time to load utils op: 0.347597599029541 seconds + 4: Time to load utils op: 0.32952260971069336 seconds + 5: Time to load utils op: 0.33096981048583984 seconds + 4: Time to load utils op: 0.3341031074523926 seconds + 5: Time to load utils op: 0.33652520179748535 seconds + 4: Time to load utils op: 0.3408393859863281 seconds + 5: Time to load utils op: 0.34325075149536133 seconds + 9: Time to load utils op: 0.3433108329772949 seconds + 5: Time to load utils op: 0.3493995666503906 seconds +10: Time to load utils op: 0.285815954208374 seconds +11: Time to load utils op: 0.31934618949890137 seconds +19: Time to load utils op: 0.3439047336578369 seconds +25: Time to load utils op: 0.26685452461242676 seconds + 9: Time to load utils op: 0.3493332862854004 seconds +27: Time to load utils op: 0.343869686126709 seconds +26: Time to load utils op: 0.3441581726074219 seconds +22: Time to load utils op: 0.34677553176879883 seconds +10: Time to load utils op: 0.2920725345611572 seconds +11: Time to load utils op: 0.32492542266845703 seconds +11: Time to load utils op: 0.3255188465118408 seconds +19: Time to load utils op: 0.3492107391357422 seconds +23: Time to load utils op: 0.3479502201080322 seconds +25: Time to load utils op: 0.27025651931762695 seconds +11: Time to load utils op: 0.3259916305541992 seconds +20: Time to load utils op: 0.3507378101348877 seconds + 9: Time to load utils op: 0.35515785217285156 seconds +14: Time to load utils op: 0.35098814964294434 seconds +27: Time to load utils op: 0.34935617446899414 seconds +26: Time to load utils op: 0.34972548484802246 seconds +14: Time to load utils op: 0.3575894832611084 seconds +22: Time to load utils op: 0.35371875762939453 seconds +10: Time to load utils op: 0.3206143379211426 seconds +23: Time to load utils op: 0.353989839553833 seconds +19: Time to load utils op: 0.35590386390686035 seconds +25: Time to load utils op: 0.27910375595092773 seconds +20: Time to load utils op: 0.3567638397216797 seconds +29: Time to load utils op: 0.26780009269714355 seconds +28: Time to load utils op: 0.3523430824279785 seconds + 9: Time to load utils op: 0.36095499992370605 seconds +25: Time to load utils op: 0.2824225425720215 seconds +27: Time to load utils op: 0.3557908535003662 seconds +13: Time to load utils op: 0.3007078170776367 seconds +20: Time to load utils op: 0.3594663143157959 seconds +26: Time to load utils op: 0.35637354850769043 seconds +31: Time to load utils op: 0.29765796661376953 seconds +16: Time to load utils op: 0.28087806701660156 seconds +15: Time to load utils op: 0.32500743865966797 seconds +22: Time to load utils op: 0.35978126525878906 seconds +10: Time to load utils op: 0.30423808097839355 seconds +23: Time to load utils op: 0.3595118522644043 seconds +18: Time to load utils op: 0.31905078887939453 seconds +21: Time to load utils op: 0.3074071407318115 seconds +19: Time to load utils op: 0.3610188961029053 seconds + 2: Time to load utils op: 0.30364203453063965 seconds +29: Time to load utils op: 0.2739114761352539 seconds +20: Time to load utils op: 0.36303186416625977 seconds +28: Time to load utils op: 0.35840630531311035 seconds +14: Time to load utils op: 0.3637199401855469 seconds + 8: Time to load utils op: 0.29138803482055664 seconds +31: Time to load utils op: 0.3036985397338867 seconds +16: Time to load utils op: 0.2840230464935303 seconds +17: Time to load utils op: 0.28639984130859375 seconds +18: Time to load utils op: 0.303668737411499 seconds +27: Time to load utils op: 0.3623979091644287 seconds +30: Time to load utils op: 0.2725710868835449 seconds +13: Time to load utils op: 0.31640076637268066 seconds +26: Time to load utils op: 0.3617589473724365 seconds + 8: Time to load utils op: 0.2944302558898926 seconds + 1: Time to load utils op: 0.29564571380615234 seconds +15: Time to load utils op: 0.33097028732299805 seconds +21: Time to load utils op: 0.3135671615600586 seconds +12: Time to load utils op: 0.3099195957183838 seconds +22: Time to load utils op: 0.3660867214202881 seconds +23: Time to load utils op: 0.36640167236328125 seconds +24: Time to load utils op: 0.28728628158569336 seconds + 2: Time to load utils op: 0.3277871608734131 seconds +28: Time to load utils op: 0.3644580841064453 seconds +29: Time to load utils op: 0.28040480613708496 seconds +14: Time to load utils op: 0.3687877655029297 seconds + 7: Time to load utils op: 0.28257131576538086 seconds +16: Time to load utils op: 0.2899308204650879 seconds +31: Time to load utils op: 0.3160066604614258 seconds +15: Time to load utils op: 0.3342282772064209 seconds +21: Time to load utils op: 0.32329773902893066 seconds +17: Time to load utils op: 0.29226040840148926 seconds +18: Time to load utils op: 0.31016993522644043 seconds +30: Time to load utils op: 0.27864909172058105 seconds +13: Time to load utils op: 0.31314563751220703 seconds + 1: Time to load utils op: 0.3015425205230713 seconds + 8: Time to load utils op: 0.30087876319885254 seconds +12: Time to load utils op: 0.30635833740234375 seconds +15: Time to load utils op: 0.3372914791107178 seconds + 6: Time to load utils op: 0.2945539951324463 seconds +24: Time to load utils op: 0.2931380271911621 seconds + 2: Time to load utils op: 0.3158717155456543 seconds +29: Time to load utils op: 0.2862846851348877 seconds +28: Time to load utils op: 0.3716721534729004 seconds + 7: Time to load utils op: 0.2888498306274414 seconds +16: Time to load utils op: 0.29622936248779297 seconds +21: Time to load utils op: 0.32013964653015137 seconds + 6: Time to load utils op: 0.2974536418914795 seconds +17: Time to load utils op: 0.2987353801727295 seconds +18: Time to load utils op: 0.316281795501709 seconds +30: Time to load utils op: 0.2845630645751953 seconds +13: Time to load utils op: 0.31905245780944824 seconds +31: Time to load utils op: 0.31554746627807617 seconds + 1: Time to load utils op: 0.3079795837402344 seconds + 8: Time to load utils op: 0.3067433834075928 seconds +12: Time to load utils op: 0.3123447895050049 seconds + 6: Time to load utils op: 0.30054211616516113 seconds +24: Time to load utils op: 0.2994816303253174 seconds + 2: Time to load utils op: 0.32164549827575684 seconds + 7: Time to load utils op: 0.29494690895080566 seconds + 6: Time to load utils op: 0.3038802146911621 seconds +17: Time to load utils op: 0.30486297607421875 seconds +30: Time to load utils op: 0.29099178314208984 seconds +12: Time to load utils op: 0.31809377670288086 seconds + 1: Time to load utils op: 0.3140873908996582 seconds +24: Time to load utils op: 0.30570006370544434 seconds + 0: [2023-05-10 12:55:21,866] [INFO] [utils.py:827:see_memory_usage] before initialize_optimizer + 7: Time to load utils op: 0.30080127716064453 seconds + 0: [2023-05-10 12:55:21,867] [INFO] [utils.py:828:see_memory_usage] MA 7.91 GB Max_MA 7.91 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,867] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.72 GB, percent = 7.7% + 3: Time to load utils op: 0.0010120868682861328 seconds + 3: Time to load utils op: 0.0005028247833251953 seconds + 3: Time to load utils op: 0.00048089027404785156 secondsTime to load utils op: 0.0004417896270751953 seconds + 3: +26: Time to load utils op: 0.0036084651947021484 seconds +26: Time to load utils op: 0.006534576416015625 seconds +26: Time to load utils op: 0.006325483322143555 seconds +26: Time to load utils op: 0.006249189376831055 seconds + 0: [2023-05-10 12:55:22,142] [INFO] [utils.py:827:see_memory_usage] end initialize_optimizer + 0: [2023-05-10 12:55:22,142] [INFO] [utils.py:828:see_memory_usage] MA 7.99 GB Max_MA 7.99 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:22,143] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.8 GB, percent = 7.7% + 4: Time to load utils op: 0.0039920806884765625 seconds + 4: Time to load utils op: 0.00044083595275878906 seconds +11: Time to load utils op: 0.003861665725708008 seconds + 4: Time to load utils op: 0.006389617919921875 seconds + 0: Time to load utils op: 0.0039615631103515625 seconds + 0: Time to load utils op: 0.003983497619628906 seconds + 0: Time to load utils op: 0.00048279762268066406 secondsTime to load utils op: 0.000476837158203125 seconds + 0: + 4: Time to load utils op: 0.00035643577575683594 seconds + 9: Time to load utils op: 0.004007577896118164 secondsTime to load utils op: 0.0041196346282958984 seconds + 9: + 5: Time to load utils op: 0.003734588623046875 seconds + 5: Time to load utils op: 0.0036592483520507812 secondsTime to load utils op: 0.006633281707763672 seconds + 5: +11: Time to load utils op: 0.00045943260192871094 seconds +11: Time to load utils op: 0.00044035911560058594 secondsTime to load utils op: 0.0004527568817138672 seconds +11: + 5: Time to load utils op: 0.0004258155822753906 seconds + 9: Time to load utils op: 0.00034356117248535156 seconds +25: Time to load utils op: 0.003735065460205078 seconds +30: Time to load utils op: 0.003693103790283203 seconds +18: Time to load utils op: 0.00398564338684082 seconds +19: Time to load utils op: 0.00639796257019043 seconds +18: Time to load utils op: 0.0003478527069091797 seconds +15: Time to load utils op: 0.003966569900512695 seconds +21: Time to load utils op: 0.003939151763916016 seconds +21: Time to load utils op: 0.003934383392333984 seconds +25: Time to load utils op: 0.006247758865356445 seconds +20: Time to load utils op: 0.0041124820709228516 seconds +20: Time to load utils op: 0.0041081905364990234 seconds +10: Time to load utils op: 0.0035958290100097656 secondsTime to load utils op: 0.0036954879760742188 seconds +10: +30: Time to load utils op: 0.00048089027404785156 seconds +29: Time to load utils op: 0.00643157958984375 seconds +29: Time to load utils op: 0.0064389705657958984 seconds +19: Time to load utils op: 0.0004096031188964844 seconds +15: Time to load utils op: 0.003978729248046875 seconds +21: Time to load utils op: 0.006569385528564453 seconds +10: Time to load utils op: 0.0003914833068847656 seconds +20: Time to load utils op: 0.0004792213439941406 seconds +29: Time to load utils op: 0.00048041343688964844 seconds +16: Time to load utils op: 0.006602764129638672 seconds +27: Time to load utils op: 0.0037276744842529297 secondsTime to load utils op: 0.0036482810974121094 seconds +27: +27: Time to load utils op: 0.006499052047729492 seconds +19: Time to load utils op: 0.0004048347473144531 seconds +19: Time to load utils op: 0.00048828125 seconds +23: Time to load utils op: 0.006470441818237305 secondsTime to load utils op: 0.006499290466308594 seconds +23: +14: Time to load utils op: 0.006613016128540039 seconds +14: Time to load utils op: 0.0004048347473144531 seconds +14: Time to load utils op: 0.0064661502838134766 seconds + 9: Time to load utils op: 0.0004677772521972656 seconds +22: Time to load utils op: 0.006505250930786133 secondsTime to load utils op: 0.003682374954223633 secondsTime to load utils op: 0.006511211395263672 seconds +22: +22: +23: Time to load utils op: 0.0003972053527832031 seconds +30: Time to load utils op: 0.0003647804260253906 seconds +25: Time to load utils op: 0.00037670135498046875 seconds +21: Time to load utils op: 0.0005049705505371094 seconds +25: Time to load utils op: 0.00047278404235839844 seconds +29: Time to load utils op: 0.0004303455352783203 seconds +20: Time to load utils op: 0.0004875659942626953 seconds +28: Time to load utils op: 0.004117250442504883 seconds +14: Time to load utils op: 0.0004086494445800781 seconds +16: Time to load utils op: 0.0005042552947998047 secondsTime to load utils op: 0.00045800209045410156 seconds +16: +23: Time to load utils op: 0.0003972053527832031 seconds +15: Time to load utils op: 0.0003604888916015625 seconds +18: Time to load utils op: 0.0003960132598876953 seconds + 2: Time to load utils op: 0.00385284423828125 seconds + 2: Time to load utils op: 0.000392913818359375 seconds +18: Time to load utils op: 0.0004942417144775391 seconds + 1: Time to load utils op: 0.0065572261810302734 secondsTime to load utils op: 0.006537199020385742 seconds + 1: + 1: Time to load utils op: 0.006501913070678711 seconds +12: Time to load utils op: 0.006595611572265625 seconds +15: Time to load utils op: 0.00037789344787597656 seconds +27: Time to load utils op: 0.0004754066467285156 seconds +24: Time to load utils op: 0.006486177444458008 seconds +24: Time to load utils op: 0.006539821624755859 seconds +13: Time to load utils op: 0.004092216491699219 secondsTime to load utils op: 0.004119157791137695 seconds +13: + 8: Time to load utils op: 0.0039937496185302734 secondsTime to load utils op: 0.003936052322387695 seconds + 8: + 8: Time to load utils op: 0.003832578659057617 seconds +28: Time to load utils op: 0.0004942417144775391 seconds +30: Time to load utils op: 0.00048232078552246094 seconds +13: Time to load utils op: 0.006656169891357422 seconds +31: Time to load utils op: 0.006508350372314453 seconds + 8: Time to load utils op: 0.003761768341064453 seconds +17: Time to load utils op: 0.004124164581298828 secondsTime to load utils op: 0.004090785980224609 seconds +17: +17: Time to load utils op: 0.0005242824554443359 seconds +10: Time to load utils op: 0.0004000663757324219 seconds +31: Time to load utils op: 0.00047898292541503906 seconds +31: Time to load utils op: 0.0004603862762451172 secondsTime to load utils op: 0.0004570484161376953 seconds +31: +13: Time to load utils op: 0.0004019737243652344 seconds +28: Time to load utils op: 0.0005011558532714844 seconds + 6: Time to load utils op: 0.006463289260864258 seconds + 6: Time to load utils op: 0.006468057632446289 seconds +17: Time to load utils op: 0.0037488937377929688 seconds +24: Time to load utils op: 0.0005033016204833984 seconds +22: Time to load utils op: 0.00034880638122558594 seconds + 1: Time to load utils op: 0.0005488395690917969 seconds + 7: Time to load utils op: 0.004132270812988281 seconds + 7: Time to load utils op: 0.006556987762451172 seconds + 6: Time to load utils op: 0.0004146099090576172 seconds +16: Time to load utils op: 0.00046372413635253906 seconds +12: Time to load utils op: 0.0004639625549316406 seconds +28: Time to load utils op: 0.0005097389221191406 seconds + 7: Time to load utils op: 0.0004711151123046875 seconds + 7: Time to load utils op: 0.0004699230194091797 seconds + 2: Time to load utils op: 0.00047016143798828125 seconds +12: Time to load utils op: 0.0004382133483886719 seconds + 6: Time to load utils op: 0.0003986358642578125 seconds + 0: [2023-05-10 12:55:22,276] [INFO] [utils.py:827:see_memory_usage] end bf16_optimizer + 0: [2023-05-10 12:55:22,277] [INFO] [utils.py:828:see_memory_usage] MA 7.99 GB Max_MA 7.99 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:22,277] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.88 GB, percent = 7.7% + 0: [2023-05-10 12:55:22,277] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Final Optimizer = FusedAdam + 0: [2023-05-10 12:55:22,277] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed using client LR scheduler + 0: [2023-05-10 12:55:22,277] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed LR Scheduler = + 0: [2023-05-10 12:55:22,277] [INFO] [logging.py:68:log_dist] [Rank 0] step=0, skipped=0, lr=[0.0002, 0.0002, 0.0002], mom=[(0.9, 0.999), (0.9, 0.999), (0.9, 0.999)] + 0: [2023-05-10 12:55:22,278] [INFO] [config.py:1007:print] DeepSpeedEngine configuration: +12: Time to load utils op: 0.00037932395935058594 seconds + 0: [2023-05-10 12:55:22,278] [INFO] [config.py:1011:print] activation_checkpointing_config { + 0: "partition_activations": false, + 0: "contiguous_memory_optimization": false, + 0: "cpu_checkpointing": false, + 0: "number_checkpoints": null, + 0: "synchronize_checkpoint_boundary": false, + 0: "profile": false + 0: } + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] aio_config ................... {'block_size': 1048576, 'queue_depth': 8, 'thread_count': 1, 'single_submit': False, 'overlap_events': True} + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] amp_enabled .................. False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] amp_params ................... False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] autotuning_config ............ { + 0: "enabled": false, + 0: "start_step": null, + 0: "end_step": null, + 0: "metric_path": null, + 0: "arg_mappings": null, + 0: "metric": "throughput", + 0: "model_info": null, + 0: "results_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_results", + 0: "exps_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_exps", + 0: "overwrite": true, + 0: "fast": true, + 0: "start_profile_step": 3, + 0: "end_profile_step": 5, + 0: "tuner_type": "gridsearch", + 0: "tuner_early_stopping": 5, + 0: "tuner_num_trials": 50, + 0: "model_info_path": null, + 0: "mp_size": 1, + 0: "max_train_batch_size": null, + 0: "min_train_batch_size": 1, + 0: "max_train_micro_batch_size_per_gpu": 1.024000e+03, + 0: "min_train_micro_batch_size_per_gpu": 1, + 0: "num_tuning_micro_batch_sizes": 3 + 0: } + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] bfloat16_enabled ............. True + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] checkpoint_parallel_write_pipeline False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] checkpoint_tag_validation_enabled True + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] checkpoint_tag_validation_fail False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] comms_config ................. + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] communication_data_type ...... None + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] compression_config ........... {'weight_quantization': {'shared_parameters': {'enabled': False, 'quantizer_kernel': False, 'schedule_offset': 0, 'quantize_groups': 1, 'quantize_verbose': False, 'quantization_type': 'symmetric', 'quantize_weight_in_forward': False, 'rounding': 'nearest', 'fp16_mixed_quantize': False, 'quantize_change_ratio': 0.001}, 'different_groups': {}}, 'activation_quantization': {'shared_parameters': {'enabled': False, 'quantization_type': 'symmetric', 'range_calibration': 'dynamic', 'schedule_offset': 1000}, 'different_groups': {}}, 'sparse_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'row_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'head_pruning': {'shared_parameters': {'enabled': False, 'method': 'topk', 'schedule_offset': 1000}, 'different_groups': {}}, 'channel_pruning': {'shared_pa + 0: rameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'layer_reduction': {'enabled': False}} + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] curriculum_enabled ........... False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] curriculum_params ............ False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] dataloader_drop_last ......... False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] disable_allgather ............ False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] dump_state ................... False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] dynamic_loss_scale_args ...... None + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_enabled ........... False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_gas_boundary_resolution 1 + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_layer_name ........ bert.encoder.layer + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_layer_num ......... 0 + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_max_iter .......... 100 + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_stability ......... 1e-06 + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_tol ............... 0.01 + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] eigenvalue_verbose ........... False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] elasticity_enabled ........... False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] flops_profiler_config ........ { + 0: "enabled": false, + 0: "profile_step": 1, + 0: "module_depth": -1, + 0: "top_modules": 1, + 0: "detailed": true, + 0: "output_file": null + 0: } + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] fp16_auto_cast ............... None + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] fp16_enabled ................. False + 0: [2023-05-10 12:55:22,279] [INFO] [config.py:1011:print] fp16_master_weights_and_gradients False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] global_rank .................. 0 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] gradient_accumulation_steps .. 4 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] gradient_clipping ............ 1.0 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] gradient_predivide_factor .... 1.0 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] initial_dynamic_scale ........ 1 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] load_universal_checkpoint .... False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] loss_scale ................... 1.0 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] memory_breakdown ............. False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] monitor_config ............... + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] nebula_config ................ { + 0: "enabled": false, + 0: "persistent_storage_path": null, + 0: "persistent_time_interval": 100, + 0: "num_of_version_in_retention": 2, + 0: "enable_nebula_load": true, + 0: "load_path": null + 0: } + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] optimizer_legacy_fusion ...... False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] optimizer_name ............... None + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] optimizer_params ............. None + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] pipeline ..................... {'stages': 'auto', 'partition': 'best', 'seed_layers': False, 'activation_checkpoint_interval': 0} + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] pld_enabled .................. False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] pld_params ................... False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] prescale_gradients ........... False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] scheduler_name ............... None + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] scheduler_params ............. None + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] sparse_attention ............. None + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] sparse_gradients_enabled ..... False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] steps_per_print .............. 2000 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] train_batch_size ............. 1024 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] train_micro_batch_size_per_gpu 2 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] use_node_local_storage ....... False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] wall_clock_breakdown ......... False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] world_size ................... 128 + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] zero_allow_untested_optimizer False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] zero_config .................. stage=0 contiguous_gradients=True reduce_scatter=True reduce_bucket_size=500000000 allgather_partitions=True allgather_bucket_size=500000000 overlap_comm=False load_from_fp32_weights=True elastic_checkpoint=False offload_param=None offload_optimizer=None sub_group_size=1000000000 cpu_offload_param=None cpu_offload_use_pin_memory=None cpu_offload=None prefetch_bucket_size=50000000 param_persistence_threshold=100000 model_persistence_threshold=9223372036854775807 max_live_parameters=1000000000 max_reuse_distance=1000000000 gather_16bit_weights_on_model_save=False stage3_gather_fp16_weights_on_model_save=False ignore_unused_parameters=True legacy_stage1=False round_robin_gradients=False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] zero_enabled ................. False + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:1011:print] zero_optimization_stage ...... 0 + 2: Time to load utils op: 0.00048613548278808594 seconds + 0: [2023-05-10 12:55:22,280] [INFO] [config.py:996:print_user_config] json = { + 0: "train_micro_batch_size_per_gpu": 2, + 0: "train_batch_size": 1.024000e+03, + 0: "gradient_clipping": 1.0, + 0: "zero_optimization": { + 0: "stage": 0 + 0: }, + 0: "bf16": { + 0: "enabled": true + 0: }, + 0: "steps_per_print": 2.000000e+03, + 0: "wall_clock_breakdown": false + 0: } + 0: Time to load utils op: 0.00043582916259765625 seconds + 0: [2023-05-10 12:55:22,281] [INFO] [engine.py:87:__init__] CONFIG: micro_batches=4 micro_batch_size=2 +24: Time to load utils op: 0.0004937648773193359 seconds + 0: [2023-05-10 12:55:22,713] [INFO] [engine.py:145:__init__] RANK=1 STAGE=0 LAYERS=41 [0, 41) STAGE_PARAMS=1407562240 (1407.562M) TOTAL_PARAMS=2815124480 (2815.124M) UNIQUE_PARAMS=2815124480 (2815.124M) + 0: [2023-05-10 12:55:22,713] [INFO] [engine.py:145:__init__] RANK=0 STAGE=0 LAYERS=41 [0, 41) STAGE_PARAMS=1407562240 (1407.562M) TOTAL_PARAMS=2815124480 (2815.124M) UNIQUE_PARAMS=2815124480 (2815.124M) +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:55:25,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:55:25,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:55:25,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:55:25,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:55:25,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +28: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:55:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +28: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +28: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:55:25,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:55:25,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:55:25,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:55:25,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:55:25,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:55:25,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:55:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:55:25,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:55:25,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:55:25,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +18: [2023-05-10 12:55:25,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +18: [2023-05-10 12:55:25,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +18: [2023-05-10 12:55:25,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:55:25,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:55:25,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:55:25,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:25,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:25,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:25,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:55:25,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 1: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:55:25,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 9: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 9: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +18: [2023-05-10 12:55:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 1: [2023-05-10 12:55:25,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 1: [2023-05-10 12:55:25,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 1: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 1: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 1: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:55:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:25,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:26,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:26,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:26,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:26,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:26,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:26,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:26,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:26,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:26,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:26,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:26,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:26,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:26,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:26,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:26,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:26,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:26,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:26,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:26,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:26,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:26,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:26,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:26,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:26,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:26,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:26,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:26,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:26,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:55:26,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:55:26,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:55:26,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:55:26,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:55:26,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:55:26,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:55:26,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:55:26,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:55:26,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:55:26,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:55:26,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:55:26,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:55:26,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:26,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:55:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:55:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:55:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:55:26,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:55:26,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:55:26,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +16: [2023-05-10 12:55:26,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +16: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:26,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:26,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:26,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:55:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:55:26,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:55:26,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:26,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:26,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:26,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:26,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:26,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:26,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:26,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:26,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:26,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:26,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:26,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:27,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:27,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:27,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:27,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:27,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:27,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:27,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:27,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:27,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:55:27,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:55:27,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:55:27,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:55:27,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:55:27,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:55:27,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:55:27,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:55:27,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +19: [2023-05-10 12:55:27,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +19: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +25: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:27,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:55:27,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:27,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:27,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:27,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:27,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:27,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:27,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:27,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:27,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:55:27,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:27,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:27,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:27,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:27,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:55:27,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:27,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:55:27,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:27,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:27,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:27,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:27,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:27,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:55:27,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:27,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:27,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:55:27,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:55:27,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:55:27,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:27,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:55:27,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:55:27,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:55:27,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:27,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:55:27,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:55:27,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:27,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:55:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +19: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:27,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:27,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +11: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:27,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:27,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:27,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:27,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:27,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +14: [2023-05-10 12:55:27,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:27,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:27,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:55:27,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:27,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:27,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:27,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:27,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:27,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:27,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:27,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +28: [2023-05-10 12:55:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +28: [2023-05-10 12:55:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +28: [2023-05-10 12:55:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:27,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:55:27,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:27,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:27,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:27,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:27,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:27,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:55:27,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:27,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:27,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:27,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:55:27,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:27,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:55:27,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:27,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:27,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:55:27,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:55:27,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:27,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:27,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:27,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:27,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:55:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:55:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:55:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:27,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:55:27,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:27,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:27,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:27,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:27,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:27,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +22: [2023-05-10 12:55:27,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +22: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +22: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +22: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:27,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:27,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:27,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +30: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:55:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:55:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:55:27,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:27,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:27,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt... +22: [2023-05-10 12:55:27,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:27,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:27,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:27,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:27,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:27,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:27,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:27,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:55:27,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:27,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +15: [2023-05-10 12:55:27,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +15: [2023-05-10 12:55:27,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +15: [2023-05-10 12:55:27,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:27,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:27,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:27,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:27,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:27,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:27,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:27,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:27,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:55:27,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:55:27,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:55:27,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:55:27,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:27,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:27,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:27,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:27,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:27,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:27,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +16: [2023-05-10 12:55:27,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:55:27,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:27,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:27,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:27,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +31: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:27,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:27,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:27,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:27,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt... +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:55:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:55:27,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:55:27,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:55:27,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:55:27,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:27,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:55:27,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:55:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:55:27,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:55:27,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:55:27,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:55:27,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +14: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:27,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:27,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:27,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:27,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:27,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:27,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +22: [2023-05-10 12:55:27,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +22: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:27,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:27,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:27,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:27,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:27,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +22: [2023-05-10 12:55:27,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:27,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +22: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:28,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:28,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +28: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:28,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:28,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:28,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:28,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:28,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +28: [2023-05-10 12:55:28,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:28,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:55:28,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:55:28,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:28,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:28,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:28,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:28,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:28,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:55:28,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:28,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:28,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:28,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:28,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:28,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:28,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:28,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:28,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:28,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:55:28,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:28,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:28,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:28,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:28,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:28,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:28,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:28,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:28,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:28,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:28,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:28,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:28,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:28,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:28,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:28,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:28,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:28,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:28,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:28,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:55:28,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:28,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +10: [2023-05-10 12:55:28,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +10: [2023-05-10 12:55:28,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:55:28,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:28,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:28,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:28,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:28,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:28,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:28,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:28,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +10: [2023-05-10 12:55:28,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:55:28,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:28,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:28,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:28,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:28,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:28,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:28,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:28,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:28,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:28,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:28,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:28,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:28,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:55:28,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:28,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:28,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:28,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:28,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:55:28,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:55:28,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:28,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:55:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:55:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:55:28,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:55:28,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:55:28,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:28,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:28,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:55:28,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:28,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:55:28,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:55:28,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:28,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:55:28,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:55:28,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:28,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +21: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:55:28,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:28,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:28,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:28,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:55:28,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:28,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:28,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:55:28,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:28,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:28,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:28,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:28,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +21: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +21: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +21: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:28,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:28,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:28,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:55:28,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:28,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:28,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:28,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:28,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:55:28,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:55:28,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:28,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:28,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:28,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:55:28,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:28,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:28,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:28,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:55:28,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:28,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +10: [2023-05-10 12:55:28,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:55:28,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:28,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:28,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:55:28,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:55:28,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:28,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:28,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:28,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:28,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:28,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:55:28,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +28: [2023-05-10 12:55:28,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:55:28,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +28: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +28: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:28,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:55:28,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:55:28,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:28,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:28,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:28,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:55:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:55:28,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +26: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:55:28,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:28,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:55:28,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:55:28,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:28,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:28,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:55:28,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:55:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:28,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:55:28,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:55:28,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:55:28,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:28,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:55:28,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:55:28,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:55:28,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:55:28,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:55:28,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:55:28,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:55:28,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:28,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:28,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:55:28,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:28,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:28,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:28,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:28,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:28,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:55:28,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:55:28,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:28,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:28,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:28,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:28,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:28,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:28,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:28,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:28,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:28,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:28,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:55:28,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:55:28,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:55:28,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:28,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:28,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:55:28,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:55:28,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:55:28,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:28,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +14: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +17: [2023-05-10 12:55:28,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:28,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:55:28,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:55:28,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:55:28,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:28,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:28,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:28,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:28,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:55:28,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:28,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:28,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +26: [2023-05-10 12:55:28,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:28,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:28,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:28,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:28,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:55:29,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:29,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:29,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:29,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:29,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:29,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:29,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:29,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:29,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:55:29,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:29,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:55:29,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:29,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:29,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:29,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:29,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:29,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:29,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:29,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:29,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:29,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:29,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:29,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:55:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:29,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:29,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:29,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:29,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:29,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:29,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:29,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:29,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +13: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:55:29,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:29,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:55:29,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:55:29,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:29,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +13: [2023-05-10 12:55:29,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:29,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:29,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:29,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:29,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:29,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:55:29,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:55:29,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:29,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:55:29,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:29,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +13: [2023-05-10 12:55:29,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +10: [2023-05-10 12:55:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:29,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:29,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:29,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:29,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:29,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:29,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:29,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:29,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:55:29,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:29,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:29,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:29,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:29,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:29,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:29,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:29,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:29,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:29,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:29,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:55:29,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:29,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:29,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:29,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:29,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:29,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:29,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:29,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:29,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:29,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:29,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +12: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +12: [2023-05-10 12:55:29,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +12: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:29,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:29,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:29,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:55:29,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:55:29,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:29,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:29,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:29,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:55:29,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:55:29,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:29,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:55:29,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:55:29,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:29,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:29,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:55:29,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:55:29,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:55:29,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:55:29,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:55:29,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:55:29,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:55:29,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:29,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:29,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:29,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:29,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:55:29,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:29,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:29,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:29,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:29,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:29,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:29,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:29,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:29,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:29,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:29,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:29,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:29,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:29,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:29,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:29,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:29,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:29,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:29,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:29,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:29,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:30,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:30,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:30,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:55:30,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:30,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:30,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:30,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:30,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:30,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:30,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:30,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:30,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:55:30,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:55:30,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:55:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:30,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:30,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:30,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:30,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:30,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:30,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:30,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:55:30,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:30,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:30,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +20: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +20: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:30,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:30,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:55:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:30,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:30,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +20: [2023-05-10 12:55:30,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:30,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:55:30,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:30,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:30,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:55:30,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:55:30,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:55:30,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:30,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:30,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:55:30,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +11: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +11: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:55:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:55:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:55:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:30,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:30,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:30,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +24: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:55:30,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:55:30,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:55:30,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:55:30,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +14: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +14: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +12: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:55:30,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:30,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:30,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:55:30,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:55:30,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:30,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +24: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +24: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:55:30,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:55:30,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:55:30,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:55:30,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:55:30,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:55:30,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:55:30,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:55:30,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:55:30,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:55:30,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:55:30,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:55:30,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:55:30,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:55:30,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +14: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +14: [2023-05-10 12:55:30,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:55:30,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:55:30,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:30,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:30,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:55:30,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +15: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +15: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +15: [2023-05-10 12:55:30,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:55:30,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:30,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +15: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +15: [2023-05-10 12:55:30,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:30,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:55:30,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:30,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:55:30,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:30,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:30,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:31,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:55:31,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:31,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:31,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:31,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:55:31,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:31,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:55:31,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:31,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:31,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:31,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:31,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:31,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:31,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:31,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:31,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:31,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:31,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:31,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:31,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:31,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:31,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:31,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:31,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:31,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:31,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:31,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:31,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:31,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:31,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:31,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:31,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:31,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:31,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:31,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +24: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:31,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:31,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:31,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:31,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:31,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:55:31,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:31,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:31,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:31,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:31,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +27: [2023-05-10 12:55:31,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:31,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +27: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +27: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +27: [2023-05-10 12:55:31,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:31,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:31,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:31,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:31,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:31,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:31,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:31,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:55:31,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:31,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:55:31,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:31,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +23: [2023-05-10 12:55:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:31,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +23: [2023-05-10 12:55:31,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:31,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:31,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +23: [2023-05-10 12:55:31,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:31,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:31,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +23: [2023-05-10 12:55:31,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:55:31,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:55:31,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:31,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:31,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:55:31,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:31,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +11: [2023-05-10 12:55:31,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:31,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:55:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:55:31,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:55:31,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:55:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:31,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:31,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:31,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:31,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:31,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:31,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:55:31,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:31,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:31,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:55:31,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:31,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:31,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:55:31,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:55:31,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:55:31,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:55:31,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:55:31,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:55:31,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:31,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:31,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:31,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:31,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:31,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:32,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:32,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +25: [2023-05-10 12:55:32,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:32,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +22: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:32,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +20: [2023-05-10 12:55:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:32,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:32,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:32,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:55:32,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:55:32,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:32,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:32,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:32,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:32,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:32,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:32,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:32,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +14: [2023-05-10 12:55:32,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:32,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:32,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:32,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:32,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:32,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:55:32,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:32,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:32,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:55:32,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:32,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:32,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:32,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:55:32,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:32,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:55:32,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:32,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:55:32,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:32,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:55:32,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:32,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:32,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:32,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:32,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:32,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:32,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:32,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:32,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:32,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:32,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:32,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:55:32,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:32,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:55:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:32,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:32,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:32,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:55:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:55:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:55:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:32,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:32,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:32,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:32,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:32,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:32,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:32,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:32,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:32,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:32,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:32,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:32,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:32,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:32,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:32,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:32,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:32,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:32,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:32,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:32,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:32,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:32,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:32,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:32,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:32,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +12: [2023-05-10 12:55:32,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:32,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:32,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +14: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +14: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:32,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:32,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:32,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:32,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:32,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:55:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:32,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:32,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +14: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:32,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:32,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:32,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:55:32,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:32,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:32,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:32,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:32,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:32,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:32,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:32,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:32,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:32,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:32,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:32,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:32,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:32,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:32,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:32,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:32,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:55:32,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:32,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:32,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:32,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:32,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +22: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +19: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +30: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:32,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:55:32,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:32,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:32,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:32,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:32,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:55:32,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +25: [2023-05-10 12:55:32,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:32,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +19: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +19: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +19: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:32,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:32,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:32,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:32,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:32,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +19: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:32,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:32,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:32,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:32,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:32,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:32,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:32,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:32,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:55:32,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:32,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:55:32,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:32,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:32,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:32,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:32,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:32,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:32,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:32,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:32,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:32,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:32,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:32,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:32,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:32,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:32,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:32,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:32,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +28: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +28: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:32,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:32,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:32,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:32,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:32,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:32,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:32,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:55:32,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:55:32,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:32,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:32,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:32,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:55:32,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:55:32,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:55:32,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:32,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:32,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:32,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:32,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:32,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:32,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:32,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:32,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:32,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:32,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:32,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:32,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:32,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:55:32,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:32,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:32,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:55:32,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:32,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:32,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:32,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:32,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:32,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:32,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:32,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:32,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:32,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:32,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:32,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:32,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:32,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:32,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:32,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:32,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:32,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:32,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:55:32,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:32,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:32,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:32,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:32,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:32,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:32,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:32,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:32,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:32,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:32,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:32,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:32,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +30: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +22: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:32,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:55:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:32,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:32,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:32,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:32,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:32,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:32,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:32,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:32,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:32,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:32,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:32,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:55:32,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +22: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +22: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:32,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:55:32,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:55:32,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:32,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:32,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:32,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:32,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:32,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:32,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:32,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:32,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:32,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:32,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:32,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:32,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:32,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:55:32,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:32,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:32,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:55:32,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:32,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:32,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:32,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:55:32,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:55:32,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:32,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:32,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:32,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:55:32,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:55:32,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:55:32,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:32,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:32,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:32,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:32,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:32,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:32,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +31: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:32,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:32,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:32,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:32,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:55:32,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:32,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:32,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:55:32,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:55:32,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:32,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:32,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +25: [2023-05-10 12:55:32,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +25: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +25: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +30: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:33,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:33,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:33,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:33,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:33,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:33,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:33,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:33,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:33,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:33,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:33,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:33,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:33,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:33,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:33,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +11: [2023-05-10 12:55:33,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:33,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:55:33,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:55:33,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:55:33,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:33,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:33,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:33,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:33,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +30: [2023-05-10 12:55:33,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +29: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:33,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:33,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +29: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:33,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:33,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:33,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:33,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:33,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:33,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:33,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:33,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:33,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:33,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:33,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:33,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:33,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:55:33,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:55:33,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:33,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:33,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:33,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:33,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:33,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:33,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +31: [2023-05-10 12:55:33,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:33,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:33,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:33,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:33,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:33,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:33,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:33,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:33,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:33,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:33,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:33,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:33,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:33,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:33,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:33,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:33,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:33,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:33,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:33,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:33,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:33,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:33,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:33,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:33,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:33,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:33,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:33,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:33,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +26: [2023-05-10 12:55:33,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:33,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:33,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:33,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:33,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:33,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:33,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:33,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:33,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:33,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:33,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:33,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:33,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:33,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:33,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:55:33,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:33,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:33,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:55:33,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:55:33,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:33,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:55:33,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:33,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:33,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:55:33,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:55:33,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:33,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:33,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:33,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:33,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:33,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:33,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:55:33,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:55:33,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:33,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:33,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:33,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +11: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:33,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:33,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:33,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:33,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:33,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:33,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:33,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:33,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:33,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:55:33,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:33,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +25: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +25: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +13: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +13: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +17: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +17: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +11: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:33,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:33,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:33,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:33,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:33,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:33,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:55:33,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:33,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +22: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:33,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:33,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:33,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +26: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:33,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:55:33,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +13: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +26: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:33,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:33,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:33,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:33,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:33,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:33,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:33,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:33,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:55:33,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:33,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:33,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:33,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:33,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:55:33,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:33,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:33,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:33,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:33,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:33,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +26: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +31: [2023-05-10 12:55:33,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:33,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +31: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:33,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:33,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:55:33,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:33,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:33,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:33,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:33,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:33,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +31: [2023-05-10 12:55:33,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:33,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:55:33,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:55:33,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:33,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:33,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:55:33,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:33,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:33,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:33,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:33,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:33,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:33,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:33,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:33,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:55:33,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:33,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:55:33,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:33,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:55:33,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:55:33,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:55:33,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:55:33,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:33,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:33,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:33,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:33,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:33,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:33,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:55:33,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:33,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:33,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:33,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:33,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:33,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:33,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:55:33,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:33,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:33,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:55:33,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:33,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:55:33,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:33,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:33,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:33,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:33,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:33,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:33,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:33,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:33,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:33,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:33,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:55:33,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:55:33,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:33,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:33,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:33,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:33,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:33,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:33,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:33,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:33,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:33,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:33,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:33,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:33,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:33,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:33,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:55:33,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:33,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:33,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:33,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:33,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:33,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:33,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:55:33,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:55:33,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:33,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +30: [2023-05-10 12:55:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:33,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:33,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:33,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:55:33,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:33,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:33,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:55:33,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:33,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:33,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:33,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:33,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:33,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:33,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:33,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:33,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:33,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:33,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:33,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:33,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:55:33,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:33,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:33,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:33,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:33,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:33,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:33,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:33,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:55:33,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:33,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:33,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:33,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:33,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:33,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:33,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:33,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:33,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:33,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:33,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:33,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:33,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:33,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:33,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:33,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:33,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:33,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:33,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:33,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:33,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:33,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:33,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:33,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:33,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:33,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:33,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:33,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:33,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:33,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:33,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:33,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:33,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:33,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:33,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:33,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:33,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:55:33,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:33,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:33,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:33,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:33,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:33,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:33,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:33,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:33,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:33,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:33,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:33,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:33,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:33,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:33,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:33,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:33,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:33,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:33,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:33,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:33,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:33,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:33,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:33,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:33,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:33,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:33,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:33,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:33,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:33,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:33,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:33,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:33,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:33,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:33,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:55:33,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:33,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:55:33,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:33,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:33,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:55:33,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:55:33,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:33,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:33,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:55:33,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:33,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +24: [2023-05-10 12:55:33,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:33,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:33,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:33,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:55:33,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:33,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:55:33,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:33,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:33,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:33,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:33,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:33,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:33,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:33,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:55:33,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:33,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:33,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:33,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:33,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:33,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:33,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:55:33,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:33,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:33,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:33,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:33,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:33,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:33,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +24: [2023-05-10 12:55:33,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:33,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:33,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:33,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:33,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:33,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:33,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:33,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:33,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:33,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:33,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:33,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:33,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:33,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:55:33,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:55:33,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:33,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:33,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:33,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:33,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:33,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:33,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:33,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:33,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:33,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:33,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:55:33,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:33,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:33,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:33,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:33,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:55:33,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:33,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:33,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:33,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:33,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:55:33,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:33,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:33,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:55:33,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:55:33,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:33,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:33,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:33,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:55:33,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:55:33,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:33,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:33,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:33,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:55:33,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:33,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:33,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:33,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:33,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:33,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:33,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:33,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:33,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:33,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:33,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:33,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:55:33,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:55:33,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:33,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:33,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:33,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +10: [2023-05-10 12:55:33,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:33,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:33,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:33,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:33,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:33,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:55:33,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:33,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:33,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:33,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:33,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:33,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:33,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:33,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:55:33,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:33,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:33,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +10: [2023-05-10 12:55:33,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:33,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:33,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:33,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:33,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:33,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:33,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:33,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:33,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:33,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +22: [2023-05-10 12:55:33,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:55:33,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:33,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:55:33,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:55:33,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:33,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:33,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:33,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:33,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:33,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:33,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:33,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:33,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:33,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:33,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +22: [2023-05-10 12:55:33,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:33,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:33,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:33,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:55:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:33,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:33,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:33,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:33,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:33,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:33,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:33,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:33,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:55:33,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:55:33,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:55:33,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +30: [2023-05-10 12:55:33,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:33,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:33,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:33,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:33,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:33,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:55:33,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:33,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:33,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:33,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:33,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:33,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:33,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:33,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:55:33,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:33,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:33,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:33,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:55:33,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:33,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:55:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:33,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:33,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:33,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:33,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:55:33,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:33,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:33,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:33,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:33,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:33,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:33,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:33,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:33,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:33,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:33,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:33,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:33,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:33,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:33,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:33,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:33,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:33,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:33,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:33,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:33,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:33,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:33,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:55:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:33,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:33,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:33,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:33,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:33,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:33,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:33,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:33,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:33,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:33,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:33,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:33,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:33,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:33,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:33,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:33,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:33,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:33,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:33,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:33,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:33,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:33,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:33,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:33,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:33,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:33,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:33,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:33,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:33,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:33,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:33,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:33,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:33,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:33,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:33,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:33,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:33,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:33,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:33,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:33,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:33,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:33,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:33,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:33,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:33,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:33,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:33,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:33,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:33,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:55:33,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:33,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:33,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:33,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:33,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:33,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:33,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:33,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:33,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:33,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:33,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:33,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:33,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:55:33,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:55:33,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:55:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:55:33,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:33,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:33,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:55:33,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:33,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:55:33,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:55:34,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:34,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:34,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:34,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:34,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:55:34,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:34,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:34,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:34,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:34,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:55:34,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:34,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:55:34,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:34,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:34,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:55:34,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:34,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:34,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:34,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:34,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:34,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:34,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:34,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:55:34,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:55:34,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:55:34,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:55:34,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:55:34,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:34,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:34,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:34,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:34,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:34,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:34,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:34,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:34,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:34,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:34,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:34,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:34,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:34,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:34,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:34,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:34,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:34,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:34,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:34,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:34,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:34,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:34,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:34,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:34,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:34,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:34,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:34,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:34,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:34,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:34,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:34,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:34,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:34,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:34,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:55:34,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:34,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:34,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:34,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:34,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:34,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:34,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:34,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:34,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:55:34,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:34,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:34,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:34,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:34,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:34,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:34,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:34,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:34,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:34,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:34,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:34,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:34,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:34,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:34,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:34,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:34,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:34,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:34,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:34,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:34,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:34,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:34,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:34,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:34,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:55:34,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:55:34,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:55:34,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:34,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:34,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:34,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:34,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:34,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:34,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:34,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:34,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:34,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:34,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:34,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:34,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:34,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:34,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:34,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:34,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:34,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:34,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:34,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:34,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:34,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:34,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:55:34,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:34,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:55:34,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:34,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:34,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:34,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:34,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:34,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:34,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:34,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:34,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:34,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:34,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:34,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:34,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:55:34,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:34,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:34,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:34,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:34,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:34,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:34,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:34,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +30: [2023-05-10 12:55:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:34,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:55:34,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:34,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:34,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:34,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +30: [2023-05-10 12:55:34,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:34,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:34,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:34,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:34,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:34,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +30: [2023-05-10 12:55:34,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:34,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:34,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:34,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:34,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:34,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:34,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:34,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:34,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:34,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:34,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:34,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:34,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:34,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:34,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:34,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:34,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:34,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:34,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:34,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:34,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:34,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:55:34,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:34,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:34,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:34,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:34,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:55:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:34,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:34,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:34,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:34,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:55:34,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:55:34,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:55:34,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:55:34,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:34,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:34,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:34,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:34,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:34,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:34,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:34,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:34,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:34,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:34,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:34,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:34,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:55:34,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +25: [2023-05-10 12:55:34,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:34,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:34,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +13: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +13: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +14: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:34,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +25: [2023-05-10 12:55:34,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:34,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:34,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:34,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:34,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +14: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +14: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:34,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:34,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +13: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:34,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:34,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:34,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:34,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:34,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:34,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:34,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:34,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:34,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:55:34,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:34,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:34,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:34,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:34,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:34,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +13: [2023-05-10 12:55:34,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:34,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:55:34,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:55:34,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:34,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:34,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:34,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:34,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:34,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +13: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +13: [2023-05-10 12:55:34,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:55:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:34,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:34,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:34,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:34,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:34,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:34,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:34,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:55:34,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:55:34,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:34,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:34,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:34,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:34,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:34,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:34,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:34,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:34,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:34,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:34,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:34,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:34,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:34,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:34,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:34,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:34,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:34,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:34,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:34,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:34,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:34,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:34,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:34,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:34,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:34,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:34,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:34,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:34,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:34,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:34,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:34,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:34,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:34,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:34,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:34,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:34,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:34,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:34,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:34,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:34,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:34,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:55:34,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:34,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:34,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:34,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:34,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:34,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:34,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:34,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:34,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:34,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:34,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:34,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:34,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:34,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:34,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:34,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:34,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:34,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:34,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:34,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:34,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:34,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:34,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:34,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:55:34,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:55:34,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:55:34,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:55:34,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:55:34,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:55:34,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:34,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:34,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:34,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:55:34,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:34,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:55:34,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:34,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:34,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:34,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:34,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:34,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:34,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:34,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:55:34,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:55:34,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:34,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +26: [2023-05-10 12:55:34,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:34,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +26: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +26: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:34,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:34,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:34,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:34,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:34,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:34,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:34,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:34,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:34,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:34,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:55:34,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:55:34,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:55:34,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:34,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:34,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:34,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:34,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:34,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:34,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:34,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:34,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:34,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:34,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:34,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:34,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:34,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:34,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:55:34,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:55:34,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:34,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:34,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:55:34,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:34,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:34,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +19: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +19: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:34,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:34,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:34,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:34,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:34,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +14: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +14: [2023-05-10 12:55:34,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +14: [2023-05-10 12:55:34,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:34,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:34,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:34,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:34,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:34,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:34,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:34,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:55:34,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:34,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:34,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:34,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:34,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:34,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:34,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:34,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:34,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:34,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:34,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:34,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:34,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:34,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:34,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:34,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:34,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:34,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:34,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:34,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:34,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:34,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:34,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:34,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:34,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:34,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:34,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:34,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:34,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:34,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:34,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:34,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:34,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:34,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:34,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:34,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:34,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:34,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:34,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:34,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:35,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:35,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:35,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:35,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:55:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:35,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:35,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:55:35,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:35,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:35,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:35,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:35,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:35,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:35,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:35,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:35,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:35,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:35,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:55:35,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:55:35,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:55:35,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:55:35,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:55:35,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:35,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:35,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:35,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:35,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:35,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:35,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:55:35,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:35,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:35,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +26: [2023-05-10 12:55:35,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:35,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:35,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:55:35,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:55:35,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:35,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:35,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:35,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:35,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +21: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:35,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:35,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:35,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +19: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +19: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:35,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +19: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:35,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:35,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:55:35,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:35,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:35,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:55:35,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:35,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:35,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:35,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:35,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +11: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:35,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:35,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:35,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:35,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:35,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:35,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:35,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:55:35,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:35,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:35,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +31: [2023-05-10 12:55:35,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:55:35,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:35,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:35,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:35,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:35,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:35,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:55:35,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +11: [2023-05-10 12:55:35,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:35,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:35,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:35,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +10: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:35,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:35,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:55:35,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +10: [2023-05-10 12:55:35,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:35,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:35,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +10: [2023-05-10 12:55:35,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:55:35,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:35,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:35,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +31: [2023-05-10 12:55:35,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:35,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:35,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:35,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:35,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:55:35,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:35,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:35,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:35,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:35,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:35,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:35,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:35,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:35,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:35,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:35,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:55:35,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:35,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:35,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:35,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:35,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:35,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:35,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:35,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:55:35,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:35,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:35,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:35,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:55:35,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:35,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:35,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:35,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +31: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:35,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:35,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +20: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +20: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +20: [2023-05-10 12:55:35,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:35,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +20: [2023-05-10 12:55:35,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +20: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +20: [2023-05-10 12:55:35,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:55:35,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:55:35,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:55:35,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:55:35,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:55:35,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:55:35,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:55:35,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:55:35,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:55:35,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:55:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:55:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:55:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:55:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:55:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:55:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:55:35,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:55:35,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:55:35,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:35,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:55:35,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:55:35,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:55:35,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:55:35,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:35,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:35,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:35,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:35,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:35,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:55:35,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:55:35,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:55:35,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:55:35,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:55:35,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:35,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:35,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:55:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:55:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:55:35,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:55:35,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:55:35,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:55:35,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:55:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:55:35,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:55:35,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:55:35,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:55:35,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:55:35,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:55:35,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:55:35,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:35,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:55:35,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:35,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:35,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:35,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:35,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:35,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:35,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:35,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:35,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:35,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:55:35,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:35,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:35,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:55:35,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:55:35,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:35,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:35,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:35,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:35,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:35,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:35,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:35,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:35,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:35,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:35,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:55:35,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:35,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:35,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +28: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:35,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:35,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:35,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:35,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:35,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:35,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:35,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:35,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:55:35,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:55:35,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:55:35,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:35,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:35,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:35,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:35,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:35,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:35,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:35,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:35,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:35,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:35,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:35,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:35,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:35,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:35,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:35,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:35,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +28: [2023-05-10 12:55:35,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:35,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:55:35,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:55:35,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:55:35,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:55:35,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:55:35,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:35,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:35,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:35,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:35,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +10: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:35,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:35,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:35,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:35,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:35,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:35,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:35,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:35,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:35,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:55:35,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:55:35,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:55:35,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:35,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:35,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:35,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:35,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:35,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:35,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:35,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:35,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:35,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:35,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:35,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:35,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:35,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:35,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:35,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:35,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:35,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:35,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:55:35,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:35,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:35,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:55:35,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:35,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:35,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:35,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:35,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:35,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:35,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:35,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:35,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:35,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:35,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:35,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:35,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:35,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:35,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:35,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:35,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:35,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:35,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:35,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:55:35,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:35,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:35,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:35,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:35,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:55:35,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:55:35,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:35,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:35,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:35,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:35,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:35,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:35,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:35,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:35,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:35,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:35,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:36,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:36,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:36,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:36,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:36,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:36,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:36,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:36,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:36,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:36,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:36,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:36,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:36,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:36,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:36,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:36,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:36,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:36,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:55:36,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:55:36,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:36,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:36,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:55:36,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:36,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:36,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:36,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:36,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:36,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:36,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:36,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:36,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:36,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:36,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:55:36,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:36,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:36,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:36,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:36,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:36,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:36,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:36,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:36,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:36,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:36,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:36,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:36,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:36,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:36,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:36,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:36,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:36,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:36,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:36,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:36,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:36,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:55:36,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:55:36,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:55:36,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:36,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:36,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:36,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:36,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:36,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:36,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:36,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:36,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:36,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:36,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:36,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:36,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:36,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:36,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:36,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +29: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:36,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:36,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:36,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:36,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:36,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:36,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +27: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +27: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:36,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:36,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:36,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:36,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:36,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:36,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:55:36,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:36,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +29: [2023-05-10 12:55:36,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:36,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:36,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +29: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +18: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +18: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +20: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:36,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:36,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:36,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:36,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:55:36,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:36,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:36,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:36,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:36,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:36,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:36,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:36,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:36,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:36,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:36,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:36,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:36,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:36,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:36,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:36,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:55:36,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:36,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:55:36,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:36,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:55:36,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:55:36,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:55:36,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:36,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:55:36,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:36,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:55:36,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:36,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:55:36,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:55:36,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:55:36,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:55:36,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:36,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:55:36,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:36,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:55:36,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:36,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:36,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:36,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:36,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:55:36,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:36,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:36,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:36,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:36,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:36,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:36,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:36,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:36,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:36,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:36,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:36,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:36,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +12: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:55:36,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:36,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:36,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:36,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:36,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:36,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:36,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:36,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:36,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:36,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:36,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:36,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:36,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:55:36,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:36,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:55:36,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:36,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:36,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:36,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:36,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:36,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:36,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:36,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:55:36,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:36,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +20: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:36,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:36,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:36,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:36,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:36,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:36,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:36,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:36,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:36,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:36,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:36,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:36,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:55:36,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:36,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:55:36,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:55:36,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:55:36,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:55:36,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:55:36,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:36,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:36,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:36,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:36,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:36,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:36,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:55:36,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:55:36,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:55:36,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:55:36,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:36,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:36,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:36,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +23: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +23: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:36,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:36,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:36,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +25: [2023-05-10 12:55:36,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:36,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:36,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:36,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:55:36,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:55:36,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:36,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:36,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:36,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:55:36,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:55:36,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:55:36,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:36,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:36,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:36,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:36,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:36,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +11: [2023-05-10 12:55:36,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +12: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +12: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +12: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:36,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +20: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +11: [2023-05-10 12:55:36,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:36,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:36,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:36,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:36,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +11: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +10: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +10: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:36,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:36,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:36,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:36,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:36,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:36,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:36,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:55:36,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:36,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:55:36,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:36,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:36,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:36,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:55:36,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:55:36,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:55:36,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:55:36,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:36,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:36,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:36,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:36,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:36,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:36,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:36,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:36,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:36,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:55:36,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:36,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:36,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:36,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:36,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:55:36,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:36,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:36,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:55:37,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt... + 4: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt... + 4: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 0: > overriding learning rate value to 0.0002 + 0: > overriding minimum learning rate value to 2e-05 + 0: > overriding warmup iterations value to 0 + 0: > overriding total number of iterations value to 1 + 0: > overriding decay style value to cosine +31: [2023-05-10 12:55:37,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:55:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,024] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 102 +10: [2023-05-10 12:55:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:37,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:55:37,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:37,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:37,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:37,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,031] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 102 +18: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:55:37,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:55:37,044] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 134 +10: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,048] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 134 + 2: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:37,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,051] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 74 +15: [2023-05-10 12:55:37,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:37,055] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 74 +31: [2023-05-10 12:55:37,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:37,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:55:37,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:37,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:37,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:37,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:55:37,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:55:37,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:55:37,097] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 132 +18: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:55:37,100] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 150 +27: [2023-05-10 12:55:37,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:37,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:37,102] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 132 +27: [2023-05-10 12:55:37,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,105] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 150 + 8: [2023-05-10 12:55:37,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:37,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:37,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:37,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:37,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:37,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:37,123] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 96 + 8: [2023-05-10 12:55:37,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,127] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 96 +14: [2023-05-10 12:55:37,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:37,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:55:37,160] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 146 +14: [2023-05-10 12:55:37,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:37,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:37,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:37,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:37,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,164] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 146 + 7: [2023-05-10 12:55:37,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:37,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:37,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:37,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:37,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:37,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:37,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:37,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:37,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:37,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:37,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:37,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:37,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:37,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:37,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:37,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:37,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:55:37,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:55:37,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:37,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:37,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:37,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:37,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:37,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:55:37,203] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 130 +22: [2023-05-10 12:55:37,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:37,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:37,207] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 46 +18: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:37,207] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 144 +16: [2023-05-10 12:55:37,207] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 130 + 7: [2023-05-10 12:55:37,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:37,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:55:37,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:37,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:37,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 144 + 5: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:37,212] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 46 + 9: [2023-05-10 12:55:37,212] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 78 +30: [2023-05-10 12:55:37,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:55:37,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:37,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:37,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:37,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,216] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 78 + 6: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:37,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:55:37,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:55:37,223] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 60 +24: [2023-05-10 12:55:37,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:37,226] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 98 + 7: [2023-05-10 12:55:37,227] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 60 + 5: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:37,229] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 44 + 7: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:55:37,230] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 62 +23: [2023-05-10 12:55:37,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:37,230] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 98 +24: [2023-05-10 12:55:37,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,233] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 44 +23: [2023-05-10 12:55:37,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:37,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,234] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 62 + 9: [2023-05-10 12:55:37,234] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 76 +18: [2023-05-10 12:55:37,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:55:37,234] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 148 +17: [2023-05-10 12:55:37,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:37,235] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 136 +24: [2023-05-10 12:55:37,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:55:37,237] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 58 + 9: [2023-05-10 12:55:37,238] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 76 +18: [2023-05-10 12:55:37,238] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 148 + 7: [2023-05-10 12:55:37,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:37,239] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 136 + 7: [2023-05-10 12:55:37,239] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 56 + 7: [2023-05-10 12:55:37,241] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 58 + 7: [2023-05-10 12:55:37,244] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 56 + 3: [2023-05-10 12:55:37,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:55:37,245] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 26 +23: [2023-05-10 12:55:37,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,251] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 26 + 3: [2023-05-10 12:55:37,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:37,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,254] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 28 +24: [2023-05-10 12:55:37,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,258] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 28 +23: [2023-05-10 12:55:37,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:37,267] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 142 +21: [2023-05-10 12:55:37,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:37,269] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 170 +17: [2023-05-10 12:55:37,271] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 142 +21: [2023-05-10 12:55:37,273] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 170 + 9: [2023-05-10 12:55:37,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:37,281] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 100 +12: [2023-05-10 12:55:37,286] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 100 + 9: [2023-05-10 12:55:37,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:55:37,292] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 188 +16: [2023-05-10 12:55:37,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:55:37,296] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 128 +23: [2023-05-10 12:55:37,296] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 188 + 9: [2023-05-10 12:55:37,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:55:37,300] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 128 + 9: [2023-05-10 12:55:37,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:55:37,303] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 24 +20: [2023-05-10 12:55:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:55:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,306] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 24 +20: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:55:37,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:37,320] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 138 +17: [2023-05-10 12:55:37,324] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 138 +31: [2023-05-10 12:55:37,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:55:37,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:37,327] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 168 +31: [2023-05-10 12:55:37,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,331] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 168 + 0: [2023-05-10 12:55:37,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:37,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:55:37,333] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 184 + 1: [2023-05-10 12:55:37,333] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 10 + 0: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,337] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 10 +23: [2023-05-10 12:55:37,338] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 184 + 4: [2023-05-10 12:55:37,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:37,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,342] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 30 +31: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:55:37,346] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 64 +25: [2023-05-10 12:55:37,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,346] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 30 +25: [2023-05-10 12:55:37,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:55:37,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,350] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 64 +25: [2023-05-10 12:55:37,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,356] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 66 +31: [2023-05-10 12:55:37,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,360] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 66 +25: [2023-05-10 12:55:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:37,363] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 204 + 2: [2023-05-10 12:55:37,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:37,367] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 204 + 2: [2023-05-10 12:55:37,368] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 18 +15: [2023-05-10 12:55:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,372] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 18 +11: [2023-05-10 12:55:37,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:37,372] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 92 +11: [2023-05-10 12:55:37,376] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 92 + 2: [2023-05-10 12:55:37,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:37,378] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 22 + 1: [2023-05-10 12:55:37,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:37,382] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 22 +23: [2023-05-10 12:55:37,382] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 190 +13: [2023-05-10 12:55:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,387] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 190 + 1: [2023-05-10 12:55:37,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:55:37,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:55:37,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:55:37,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:55:37,400] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 114 + 1: [2023-05-10 12:55:37,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:37,402] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 180 + 1: [2023-05-10 12:55:37,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:55:37,404] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 114 +15: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:37,406] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 228 + 6: [2023-05-10 12:55:37,406] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 48 +22: [2023-05-10 12:55:37,406] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 180 +13: [2023-05-10 12:55:37,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:37,409] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 228 +25: [2023-05-10 12:55:37,409] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 202 + 1: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,410] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 48 + 5: [2023-05-10 12:55:37,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:37,410] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 40 +29: [2023-05-10 12:55:37,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:37,412] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 12 + 1: [2023-05-10 12:55:37,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,413] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 202 +27: [2023-05-10 12:55:37,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,415] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 40 +30: [2023-05-10 12:55:37,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:37,415] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 242 +29: [2023-05-10 12:55:37,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,417] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 12 +23: [2023-05-10 12:55:37,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:37,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,418] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 186 +13: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,420] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 242 +13: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:55:37,422] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 186 +29: [2023-05-10 12:55:37,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,422] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 140 + 1: [2023-05-10 12:55:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:37,423] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 14 + 4: [2023-05-10 12:55:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:37,424] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 38 +29: [2023-05-10 12:55:37,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:55:37,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,426] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 140 +27: [2023-05-10 12:55:37,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:37,427] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 94 + 1: [2023-05-10 12:55:37,427] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 14 + 4: [2023-05-10 12:55:37,428] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 38 +27: [2023-05-10 12:55:37,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:55:37,431] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 70 +11: [2023-05-10 12:55:37,431] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 94 + 2: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:55:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:55:37,434] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 106 + 8: [2023-05-10 12:55:37,436] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 70 +13: [2023-05-10 12:55:37,438] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 106 + 2: [2023-05-10 12:55:37,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:37,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:55:37,444] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 112 +28: [2023-05-10 12:55:37,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:37,444] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 152 +28: [2023-05-10 12:55:37,444] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 224 +14: [2023-05-10 12:55:37,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:55:37,448] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 104 +13: [2023-05-10 12:55:37,448] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 110 +21: [2023-05-10 12:55:37,448] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 172 +28: [2023-05-10 12:55:37,448] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 224 +19: [2023-05-10 12:55:37,448] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 152 +14: [2023-05-10 12:55:37,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,448] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 112 +28: [2023-05-10 12:55:37,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:37,449] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 226 +13: [2023-05-10 12:55:37,452] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 104 +21: [2023-05-10 12:55:37,452] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 172 +13: [2023-05-10 12:55:37,452] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 110 +28: [2023-05-10 12:55:37,453] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 226 +27: [2023-05-10 12:55:37,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:37,455] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 200 + 2: [2023-05-10 12:55:37,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:55:37,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,459] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 200 +22: [2023-05-10 12:55:37,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:37,460] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 182 + 6: [2023-05-10 12:55:37,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:55:37,460] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 52 +14: [2023-05-10 12:55:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,464] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 182 + 6: [2023-05-10 12:55:37,466] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 52 +14: [2023-05-10 12:55:37,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:37,466] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 214 + 2: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:55:37,469] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 120 +11: [2023-05-10 12:55:37,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:37,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:37,469] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 88 +10: [2023-05-10 12:55:37,469] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 80 + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,470] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 214 +28: [2023-05-10 12:55:37,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:37,471] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 230 +15: [2023-05-10 12:55:37,473] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 120 +11: [2023-05-10 12:55:37,473] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 88 +10: [2023-05-10 12:55:37,475] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 80 +28: [2023-05-10 12:55:37,475] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 230 +14: [2023-05-10 12:55:37,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:55:37,480] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 220 +29: [2023-05-10 12:55:37,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:37,483] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 234 +27: [2023-05-10 12:55:37,484] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 220 +29: [2023-05-10 12:55:37,487] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 234 + 2: [2023-05-10 12:55:37,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:37,488] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 20 +14: [2023-05-10 12:55:37,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:37,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:37,488] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 254 +14: [2023-05-10 12:55:37,488] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 116 +25: [2023-05-10 12:55:37,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:37,489] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 206 +20: [2023-05-10 12:55:37,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:37,489] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 162 +30: [2023-05-10 12:55:37,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:37,491] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 240 +20: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:37,492] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 164 + 2: [2023-05-10 12:55:37,492] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 20 +31: [2023-05-10 12:55:37,492] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 254 +14: [2023-05-10 12:55:37,492] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 116 + 2: [2023-05-10 12:55:37,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:37,493] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 162 +25: [2023-05-10 12:55:37,493] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 206 + 2: [2023-05-10 12:55:37,494] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 16 +24: [2023-05-10 12:55:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:37,495] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 240 +24: [2023-05-10 12:55:37,495] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 192 +20: [2023-05-10 12:55:37,496] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 164 + 2: [2023-05-10 12:55:37,498] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 16 +24: [2023-05-10 12:55:37,499] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 192 + 1: [2023-05-10 12:55:37,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:37,499] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 8 + 5: [2023-05-10 12:55:37,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:37,501] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 42 +11: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:37,501] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 90 +13: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:55:37,502] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 108 + 6: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:37,502] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 236 + 6: [2023-05-10 12:55:37,502] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 50 +29: [2023-05-10 12:55:37,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:37,503] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 232 + 0: [2023-05-10 12:55:37,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:37,504] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 8 + 5: [2023-05-10 12:55:37,505] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 42 + 0: [2023-05-10 12:55:37,505] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 0 +11: [2023-05-10 12:55:37,505] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 90 +13: [2023-05-10 12:55:37,506] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 108 +24: [2023-05-10 12:55:37,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:37,506] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 194 +29: [2023-05-10 12:55:37,507] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 236 +29: [2023-05-10 12:55:37,508] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 232 + 6: [2023-05-10 12:55:37,509] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 50 + 0: [2023-05-10 12:55:37,509] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 0 +24: [2023-05-10 12:55:37,510] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 194 +22: [2023-05-10 12:55:37,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:37,510] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 178 + 0: could not find arguments in the checkpoint ... + 0: checkpoint version 3.0 + 3: [2023-05-10 12:55:37,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:37,514] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 212 +29: [2023-05-10 12:55:37,514] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 238 +21: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,514] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 216 +22: [2023-05-10 12:55:37,514] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 178 +24: [2023-05-10 12:55:37,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:37,515] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 196 +26: [2023-05-10 12:55:37,518] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 212 +29: [2023-05-10 12:55:37,518] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 238 +27: [2023-05-10 12:55:37,519] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 216 +24: [2023-05-10 12:55:37,519] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 196 + 4: [2023-05-10 12:55:37,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:37,521] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 36 + 3: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:55:37,525] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 4 + 4: [2023-05-10 12:55:37,525] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 36 +27: [2023-05-10 12:55:37,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:55:37,526] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 218 + 0: [2023-05-10 12:55:37,529] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 4 +27: [2023-05-10 12:55:37,530] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 218 +22: [2023-05-10 12:55:37,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:37,531] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 176 +19: [2023-05-10 12:55:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:37,533] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 156 +19: [2023-05-10 12:55:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:37,534] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 158 +15: [2023-05-10 12:55:37,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:55:37,534] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 126 +22: [2023-05-10 12:55:37,535] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 176 + 3: [2023-05-10 12:55:37,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:55:37,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:37,536] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 244 +21: [2023-05-10 12:55:37,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:55:37,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,538] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 156 + 3: [2023-05-10 12:55:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,538] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 126 +19: [2023-05-10 12:55:37,538] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 158 +30: [2023-05-10 12:55:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:37,539] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 246 +21: [2023-05-10 12:55:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:55:37,540] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 244 +18: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:37,543] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 246 +15: [2023-05-10 12:55:37,543] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 124 + 7: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:37,544] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 248 + 7: [2023-05-10 12:55:37,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:55:37,545] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 122 + 6: [2023-05-10 12:55:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,547] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 124 +30: [2023-05-10 12:55:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:55:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,548] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 248 +30: [2023-05-10 12:55:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:55:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,550] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 122 + 3: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:55:37,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:55:37,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:37,552] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 252 +16: [2023-05-10 12:55:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:55:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:55:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:55:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,555] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 154 + 7: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,555] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 72 + 6: [2023-05-10 12:55:37,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,556] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 252 + 6: [2023-05-10 12:55:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,559] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 72 +18: [2023-05-10 12:55:37,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,561] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 154 +11: [2023-05-10 12:55:37,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:37,565] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 198 +20: [2023-05-10 12:55:37,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:37,567] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 166 +30: [2023-05-10 12:55:37,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,569] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 198 +17: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:55:37,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:55:37,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:55:37,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,571] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 166 + 5: [2023-05-10 12:55:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:55:37,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,574] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 54 +26: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +10: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,579] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 54 +23: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +28: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +28: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:55:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:55:37,579] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 210 + 6: [2023-05-10 12:55:37,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:37,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +22: [2023-05-10 12:55:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +10: [2023-05-10 12:55:37,582] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 82 +11: [2023-05-10 12:55:37,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,583] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 210 + 6: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:55:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +23: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,587] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 82 +19: [2023-05-10 12:55:37,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,589] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 86 +23: [2023-05-10 12:55:37,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:55:37,590] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 68 +28: [2023-05-10 12:55:37,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +17: [2023-05-10 12:55:37,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:37,594] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 86 + 0: [2023-05-10 12:55:37,594] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 2 +16: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,595] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 68 + 5: [2023-05-10 12:55:37,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,599] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 2 +17: [2023-05-10 12:55:37,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:55:37,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:55:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:37,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,603] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 32 +19: [2023-05-10 12:55:37,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +28: [2023-05-10 12:55:37,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +28: [2023-05-10 12:55:37,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,607] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 32 +27: [2023-05-10 12:55:37,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:55:37,610] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 222 +12: [2023-05-10 12:55:37,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +28: [2023-05-10 12:55:37,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:37,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,614] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 6 +27: [2023-05-10 12:55:37,614] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 222 +28: [2023-05-10 12:55:37,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:55:37,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:55:37,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,619] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 6 +10: [2023-05-10 12:55:37,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:37,633] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 84 + 4: [2023-05-10 12:55:37,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:55:37,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:55:37,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,638] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 84 +24: [2023-05-10 12:55:37,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:37,640] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 34 +31: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,645] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 34 +12: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:55:37,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:55:37,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:55:37,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:55:37,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:55:37,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:55:37,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:55:37,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:37,666] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 174 +15: [2023-05-10 12:55:37,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:55:37,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:55:37,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:37,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,670] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 160 +24: [2023-05-10 12:55:37,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,670] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 174 +29: [2023-05-10 12:55:37,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:55:37,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,674] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 160 + 4: [2023-05-10 12:55:37,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:55:37,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:55:37,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:37,708] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 208 +18: [2023-05-10 12:55:37,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:55:37,712] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 208 +14: [2023-05-10 12:55:37,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:55:37,713] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 118 +14: [2023-05-10 12:55:37,717] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 118 +14: [2023-05-10 12:55:37,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:55:37,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:55:37,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +18: [2023-05-10 12:55:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +18: [2023-05-10 12:55:37,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:55:37,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:55:37,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:37,736] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 250 + 7: [2023-05-10 12:55:37,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,740] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 250 + 3: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:55:37,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:55:37,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:55:37,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:55:37,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:55:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:55:37,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +23: [2023-05-10 12:55:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:37,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:37,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:37,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:37,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:37,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:37,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:37,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:37,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:37,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:37,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +23: [2023-05-10 12:55:37,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:37,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:37,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:37,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:37,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:37,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:37,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:55:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:38,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:38,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:38,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:38,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:38,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:55:38,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:55:38,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:55:38,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:38,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:38,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:38,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:38,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:38,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:38,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:55:38,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:38,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:38,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:38,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:38,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:55:38,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:38,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:55:38,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:55:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:38,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:55:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:38,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:38,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:38,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:38,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:38,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:38,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:38,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:55:38,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:38,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:38,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:55:38,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:55:38,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:38,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:55:38,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:55:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:55:38,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:38,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:55:38,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:38,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:38,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:38,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:38,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:55:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:55:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:55:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:55:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:38,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:38,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:38,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:38,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:38,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:38,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:38,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:38,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:38,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:38,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:38,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:38,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:38,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:38,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:38,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:55:38,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:38,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:38,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:55:38,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:38,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:38,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:38,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:55:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:38,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:38,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:38,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:55:38,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:55:38,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:55:38,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:55:38,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:55:38,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:55:38,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:55:38,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:55:38,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:55:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:55:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:55:38,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:55:38,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:55:38,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:55:38,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:55:38,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:38,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:38,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:38,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:38,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:55:38,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:38,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:55:38,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:38,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:55:38,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:55:38,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:55:38,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:55:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:55:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:55:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:55:38,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:55:38,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:55:38,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:55:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:55:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +16: [2023-05-10 12:55:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +16: [2023-05-10 12:55:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:55:38,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:55:38,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:55:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:55:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:55:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:55:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:55:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:38,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:38,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:55:38,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:55:38,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:38,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:55:38,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:55:38,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:55:38,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:55:38,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:55:38,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:55:38,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:38,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:55:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:55:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:55:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:55:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +11: [2023-05-10 12:55:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +11: [2023-05-10 12:55:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +11: [2023-05-10 12:55:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +11: [2023-05-10 12:55:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:55:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:55:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:55:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:55:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:55:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:55:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:55:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:55:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:55:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:55:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:55:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:55:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:55:38,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:55:38,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:55:38,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:55:38,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,698] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 11 + 1: [2023-05-10 12:55:38,702] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 11 + 0: [2023-05-10 12:55:38,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:55:38,720] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 5 +25: [2023-05-10 12:55:38,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,723] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 203 + 0: [2023-05-10 12:55:38,724] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 5 +25: [2023-05-10 12:55:38,728] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 203 +29: [2023-05-10 12:55:38,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:38,744] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 237 +29: [2023-05-10 12:55:38,748] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 237 +25: [2023-05-10 12:55:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,758] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 205 + 3: [2023-05-10 12:55:38,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:38,759] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 29 +25: [2023-05-10 12:55:38,762] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 205 + 3: [2023-05-10 12:55:38,763] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 29 + 6: [2023-05-10 12:55:38,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:38,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:38,767] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 233 + 6: [2023-05-10 12:55:38,767] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 49 +29: [2023-05-10 12:55:38,771] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 233 + 6: [2023-05-10 12:55:38,772] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 49 +29: [2023-05-10 12:55:38,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:38,773] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 235 +29: [2023-05-10 12:55:38,777] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 235 + 4: [2023-05-10 12:55:38,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:38,785] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 39 +18: [2023-05-10 12:55:38,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:38,786] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 149 + 7: [2023-05-10 12:55:38,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:55:38,788] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 57 + 4: [2023-05-10 12:55:38,790] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 39 +18: [2023-05-10 12:55:38,790] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 149 +13: [2023-05-10 12:55:38,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:55:38,793] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 111 + 7: [2023-05-10 12:55:38,793] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 57 +13: [2023-05-10 12:55:38,797] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 111 +15: [2023-05-10 12:55:38,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,798] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 125 +15: [2023-05-10 12:55:38,802] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 125 +13: [2023-05-10 12:55:38,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:55:38,803] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 109 + 4: [2023-05-10 12:55:38,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:38,806] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 35 +13: [2023-05-10 12:55:38,807] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 109 +25: [2023-05-10 12:55:38,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,808] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 201 +25: [2023-05-10 12:55:38,812] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 201 + 4: [2023-05-10 12:55:38,812] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 35 + 6: [2023-05-10 12:55:38,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:55:38,831] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 55 + 6: [2023-05-10 12:55:38,835] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 55 +30: [2023-05-10 12:55:38,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:38,840] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 241 +25: [2023-05-10 12:55:38,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,841] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 207 +18: [2023-05-10 12:55:38,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:38,842] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 151 +30: [2023-05-10 12:55:38,844] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 241 +25: [2023-05-10 12:55:38,845] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 207 +18: [2023-05-10 12:55:38,846] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 151 +11: [2023-05-10 12:55:38,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:38,848] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 89 + 1: [2023-05-10 12:55:38,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,851] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 9 +11: [2023-05-10 12:55:38,852] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 89 + 0: [2023-05-10 12:55:38,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:55:38,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:55:38,854] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 3 +13: [2023-05-10 12:55:38,854] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 105 +22: [2023-05-10 12:55:38,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:55:38,855] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 177 + 1: [2023-05-10 12:55:38,855] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 9 + 6: [2023-05-10 12:55:38,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:55:38,858] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 51 +13: [2023-05-10 12:55:38,858] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 105 + 0: [2023-05-10 12:55:38,859] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 3 +22: [2023-05-10 12:55:38,859] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 177 + 0: [2023-05-10 12:55:38,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,860] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 193 + 0: [2023-05-10 12:55:38,860] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 1 +24: [2023-05-10 12:55:38,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,861] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 197 + 6: [2023-05-10 12:55:38,862] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 51 +13: [2023-05-10 12:55:38,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:55:38,863] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 107 +24: [2023-05-10 12:55:38,865] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 193 + 7: [2023-05-10 12:55:38,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,865] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 191 + 7: [2023-05-10 12:55:38,865] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 59 +24: [2023-05-10 12:55:38,865] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 197 + 0: [2023-05-10 12:55:38,865] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 1 +31: [2023-05-10 12:55:38,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:38,866] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 251 +13: [2023-05-10 12:55:38,867] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 107 + 0: [2023-05-10 12:55:38,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:55:38,869] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 7 +14: [2023-05-10 12:55:38,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,869] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 191 +14: [2023-05-10 12:55:38,869] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 113 + 7: [2023-05-10 12:55:38,869] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 59 + 2: [2023-05-10 12:55:38,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:55:38,870] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 21 +31: [2023-05-10 12:55:38,870] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 251 + 7: [2023-05-10 12:55:38,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:55:38,872] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 63 +29: [2023-05-10 12:55:38,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:38,873] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 239 +14: [2023-05-10 12:55:38,873] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 113 + 0: [2023-05-10 12:55:38,873] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 7 + 2: [2023-05-10 12:55:38,874] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 21 + 7: [2023-05-10 12:55:38,876] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 63 +29: [2023-05-10 12:55:38,877] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 239 +24: [2023-05-10 12:55:38,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,878] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 195 + 5: [2023-05-10 12:55:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:55:38,882] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 41 +24: [2023-05-10 12:55:38,882] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 195 +30: [2023-05-10 12:55:38,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:38,886] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 247 + 5: [2023-05-10 12:55:38,887] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 41 +30: [2023-05-10 12:55:38,890] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 247 + 7: [2023-05-10 12:55:38,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:55:38,891] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 61 + 7: [2023-05-10 12:55:38,896] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 61 + 1: [2023-05-10 12:55:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,902] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 15 + 9: [2023-05-10 12:55:38,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:38,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:38,904] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 73 +15: [2023-05-10 12:55:38,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:38,904] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 85 +15: [2023-05-10 12:55:38,904] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 121 + 1: [2023-05-10 12:55:38,906] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 15 + 5: [2023-05-10 12:55:38,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,908] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 121 + 5: [2023-05-10 12:55:38,908] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 43 + 9: [2023-05-10 12:55:38,909] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 73 +14: [2023-05-10 12:55:38,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:55:38,909] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 119 +27: [2023-05-10 12:55:38,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:38,909] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 221 +23: [2023-05-10 12:55:38,909] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 187 + 2: [2023-05-10 12:55:38,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:55:38,910] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 17 +10: [2023-05-10 12:55:38,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:38,911] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 87 +10: [2023-05-10 12:55:38,911] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 85 + 5: [2023-05-10 12:55:38,913] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 43 +23: [2023-05-10 12:55:38,913] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 187 +14: [2023-05-10 12:55:38,914] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 119 + 2: [2023-05-10 12:55:38,914] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 17 + 6: [2023-05-10 12:55:38,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:38,914] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 221 + 6: [2023-05-10 12:55:38,914] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 53 +10: [2023-05-10 12:55:38,915] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 87 + 6: [2023-05-10 12:55:38,919] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 53 +31: [2023-05-10 12:55:38,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:38,919] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 253 +16: [2023-05-10 12:55:38,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:38,921] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 135 +30: [2023-05-10 12:55:38,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:38,923] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 243 +31: [2023-05-10 12:55:38,923] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 253 +16: [2023-05-10 12:55:38,925] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 135 +23: [2023-05-10 12:55:38,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,927] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 189 +30: [2023-05-10 12:55:38,927] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 243 +15: [2023-05-10 12:55:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,928] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 127 +15: [2023-05-10 12:55:38,928] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 123 +16: [2023-05-10 12:55:38,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:38,929] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 129 +11: [2023-05-10 12:55:38,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:38,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 91 +23: [2023-05-10 12:55:38,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 189 + 2: [2023-05-10 12:55:38,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 127 +15: [2023-05-10 12:55:38,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 123 + 2: [2023-05-10 12:55:38,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 23 + 8: [2023-05-10 12:55:38,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:38,933] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 67 +16: [2023-05-10 12:55:38,933] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 129 +17: [2023-05-10 12:55:38,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:38,935] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 141 +23: [2023-05-10 12:55:38,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,935] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 185 +11: [2023-05-10 12:55:38,936] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 91 +24: [2023-05-10 12:55:38,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:55:38,936] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 23 +24: [2023-05-10 12:55:38,937] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 199 +20: [2023-05-10 12:55:38,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,937] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 161 + 8: [2023-05-10 12:55:38,938] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 67 +17: [2023-05-10 12:55:38,939] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 141 +23: [2023-05-10 12:55:38,940] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 185 +24: [2023-05-10 12:55:38,940] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 199 +20: [2023-05-10 12:55:38,942] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 161 + 3: [2023-05-10 12:55:38,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:38,943] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 27 + 3: [2023-05-10 12:55:38,948] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 27 +14: [2023-05-10 12:55:38,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:55:38,949] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 117 + 1: [2023-05-10 12:55:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,951] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 13 +14: [2023-05-10 12:55:38,953] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 117 + 4: [2023-05-10 12:55:38,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:38,953] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 37 + 1: [2023-05-10 12:55:38,955] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 13 +18: [2023-05-10 12:55:38,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:38,957] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 145 + 4: [2023-05-10 12:55:38,958] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 37 + 3: [2023-05-10 12:55:38,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:38,959] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 25 +18: [2023-05-10 12:55:38,961] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 145 + 3: [2023-05-10 12:55:38,963] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 25 + 9: [2023-05-10 12:55:38,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:38,966] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 75 +22: [2023-05-10 12:55:38,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:55:38,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 183 +21: [2023-05-10 12:55:38,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:38,970] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 175 + 9: [2023-05-10 12:55:38,970] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 75 +22: [2023-05-10 12:55:38,971] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 183 +21: [2023-05-10 12:55:38,974] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 175 +16: [2023-05-10 12:55:38,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:38,975] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 131 +17: [2023-05-10 12:55:38,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:38,977] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 139 +17: [2023-05-10 12:55:38,981] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 139 +16: [2023-05-10 12:55:38,981] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 131 +19: [2023-05-10 12:55:38,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:38,982] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 157 +20: [2023-05-10 12:55:38,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,983] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 163 +19: [2023-05-10 12:55:38,986] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 157 +20: [2023-05-10 12:55:38,987] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 163 +14: [2023-05-10 12:55:38,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:55:38,988] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 115 +19: [2023-05-10 12:55:38,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:38,989] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 155 +14: [2023-05-10 12:55:38,992] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 115 +19: [2023-05-10 12:55:38,993] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 155 +11: [2023-05-10 12:55:38,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:38,994] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 95 +17: [2023-05-10 12:55:38,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:38,995] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 137 +12: [2023-05-10 12:55:38,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:38,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:38,997] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 99 +11: [2023-05-10 12:55:38,997] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 93 +11: [2023-05-10 12:55:38,999] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 95 +17: [2023-05-10 12:55:38,999] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 137 +11: [2023-05-10 12:55:39,001] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 93 +12: [2023-05-10 12:55:39,001] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 99 + 8: [2023-05-10 12:55:39,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:39,002] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 65 +12: [2023-05-10 12:55:39,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:39,002] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 97 +28: [2023-05-10 12:55:39,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:39,003] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 229 +18: [2023-05-10 12:55:39,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:39,005] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 147 +31: [2023-05-10 12:55:39,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:39,006] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 249 + 8: [2023-05-10 12:55:39,006] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 65 +12: [2023-05-10 12:55:39,007] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 97 +28: [2023-05-10 12:55:39,008] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 229 +30: [2023-05-10 12:55:39,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:39,009] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 245 +31: [2023-05-10 12:55:39,010] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 249 +18: [2023-05-10 12:55:39,010] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 147 + 8: [2023-05-10 12:55:39,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:39,011] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 71 +26: [2023-05-10 12:55:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:55:39,013] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 215 +30: [2023-05-10 12:55:39,013] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 245 + 8: [2023-05-10 12:55:39,015] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 71 +17: [2023-05-10 12:55:39,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:39,016] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 143 +20: [2023-05-10 12:55:39,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:39,018] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 165 +26: [2023-05-10 12:55:39,019] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 215 +17: [2023-05-10 12:55:39,020] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 143 +28: [2023-05-10 12:55:39,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:39,020] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 227 +20: [2023-05-10 12:55:39,022] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 165 +19: [2023-05-10 12:55:39,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:39,023] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 159 + 5: [2023-05-10 12:55:39,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:55:39,023] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 45 +28: [2023-05-10 12:55:39,024] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 227 +19: [2023-05-10 12:55:39,027] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 159 + 5: [2023-05-10 12:55:39,028] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 45 +21: [2023-05-10 12:55:39,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:39,030] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 169 + 3: [2023-05-10 12:55:39,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:39,032] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 31 +28: [2023-05-10 12:55:39,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:39,033] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 231 +21: [2023-05-10 12:55:39,034] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 169 + 3: [2023-05-10 12:55:39,036] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 31 +28: [2023-05-10 12:55:39,038] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 231 +31: [2023-05-10 12:55:39,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:39,039] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 255 +26: [2023-05-10 12:55:39,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:39,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:39,040] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 33 +26: [2023-05-10 12:55:39,040] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 211 + 8: [2023-05-10 12:55:39,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:39,043] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 69 +26: [2023-05-10 12:55:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:39,043] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 255 + 4: [2023-05-10 12:55:39,043] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 33 +26: [2023-05-10 12:55:39,043] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 213 + 8: [2023-05-10 12:55:39,047] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 69 +12: [2023-05-10 12:55:39,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:39,052] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 101 +22: [2023-05-10 12:55:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:55:39,054] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 179 +26: [2023-05-10 12:55:39,054] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 211 +27: [2023-05-10 12:55:39,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:39,055] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 217 + 2: [2023-05-10 12:55:39,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:39,057] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 101 + 2: [2023-05-10 12:55:39,057] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 19 +26: [2023-05-10 12:55:39,057] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 213 +22: [2023-05-10 12:55:39,059] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 179 +16: [2023-05-10 12:55:39,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:39,060] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 133 +22: [2023-05-10 12:55:39,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:55:39,060] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 181 +27: [2023-05-10 12:55:39,060] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 217 +20: [2023-05-10 12:55:39,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:39,061] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 167 + 2: [2023-05-10 12:55:39,062] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 19 +16: [2023-05-10 12:55:39,064] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 133 +22: [2023-05-10 12:55:39,064] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 181 +20: [2023-05-10 12:55:39,065] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 167 + 9: [2023-05-10 12:55:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:39,075] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 77 +12: [2023-05-10 12:55:39,075] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 103 + 9: [2023-05-10 12:55:39,079] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 77 +12: [2023-05-10 12:55:39,081] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 103 +19: [2023-05-10 12:55:39,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:39,086] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 153 + 9: [2023-05-10 12:55:39,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:39,088] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 79 +10: [2023-05-10 12:55:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:39,089] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 83 +27: [2023-05-10 12:55:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:39,091] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 223 + 9: [2023-05-10 12:55:39,092] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 79 +19: [2023-05-10 12:55:39,092] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 153 +10: [2023-05-10 12:55:39,093] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 83 +28: [2023-05-10 12:55:39,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:39,094] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 225 +27: [2023-05-10 12:55:39,095] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 223 +28: [2023-05-10 12:55:39,099] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 225 + 5: [2023-05-10 12:55:39,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:55:39,107] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 47 +10: [2023-05-10 12:55:39,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:39,108] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 81 +27: [2023-05-10 12:55:39,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:39,110] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 219 + 5: [2023-05-10 12:55:39,112] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 47 +10: [2023-05-10 12:55:39,113] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 81 +27: [2023-05-10 12:55:39,114] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 219 +21: [2023-05-10 12:55:39,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:39,132] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 171 +21: [2023-05-10 12:55:39,135] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 171 +26: [2023-05-10 12:55:39,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:55:39,170] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 209 +26: [2023-05-10 12:55:39,187] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 209 +21: [2023-05-10 12:55:39,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:39,228] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 173 +21: [2023-05-10 12:55:39,232] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 173 + 0: successfully loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity50 at iteration 0 +31: time (ms) | load-checkpoint: 13905.34 + 0: estimated model parameters: 2.81512448 + 0: estimated model parameters without embeddings: 2.6755328 + 0: [after model, optimizer, and learning rate scheduler are built] datetime: 2023-05-10 12:55:40 + 0: > building train, validation, and test datasets ... + 0: > datasets target sizes (minimum size): + 0: train: 1 + 0: validation: 102400 + 0: test: 102400 + 0: > building train, validation, and test datasets for GPT ... + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.059151 seconds + 0: number of documents: 3133972 + 0: > dataset split: + 0: train: + 0: document indices in [0, 3133972) total of 3133972 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.030 seconds + 0: total number of samples: 731002 + 0: total number of epochs: 1 + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.006884 seconds + 0: number of documents: 364608 + 0: > dataset split: + 0: validation: + 0: document indices in [0, 364608) total of 364608 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.013 seconds + 0: total number of samples: 169955 + 0: total number of epochs: 2 + 0: > finished creating GPT datasets ... + 0: [after dataloaders are built] datetime: 2023-05-10 12:55:48 + 0: done with setup ... + 0: training ... +31: time (ms) | model-and-optimizer-setup: 31570.86 | train/valid/test-data-iterators-setup: 4658.28 + 0: [after training is done] datetime: 2023-05-10 12:55:48 +31: ----------------------------------------------------------------------------------------------------------------- +31: validation loss at the end of training for val data | lm loss value: 2.636081E+00 | lm loss PPL: 1.395840E+01 | +31: ----------------------------------------------------------------------------------------------------------------- +END 3491169: Wed 10 May 2023 12:57:30 PM EEST